diff --git "a/8b7178b44b/3430925.out" "b/8b7178b44b/3430925.out" new file mode 100644--- /dev/null +++ "b/8b7178b44b/3430925.out" @@ -0,0 +1,51784 @@ +Model parameters: d_model 4096 ffw_size 16384 kv_size 128 n_heads 32 n_layers 42 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 2 --pipeline-model-parallel-size 2 --num-layers 42 --hidden-size 4096 --num-attention-heads 32 --kv-channels 128 --ffn-hidden-size 16384 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 1 --global-batch-size 512 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-8b7178b44bval --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 5000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_8b7178b44bval --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-8b7-178b-c4-repetitions/8b7178b44b --load lm1-8b7-178b-c4-repetitions/8b7178b44b --train-weighted-split-paths-path train400m.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --num-workers 0 --valid-num-workers 0 --deepspeed --deepspeed_config ds_configs/3430925.json --zero-stage 0 +START 3430925: Sat 29 Apr 2023 10:54:36 AM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 48.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== +52: +52: +52: ======================= ROCm System Management Interface ======================= +52: ================================= Concise Info ================================= +52: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +52: 0 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 1 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 2 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 6 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: ================================================================================ +52: ============================= End of ROCm SMI Log ============================== +53: +53: +53: ======================= ROCm System Management Interface ======================= +53: ================================= Concise Info ================================= +53: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +53: 0 44.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 2 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 6 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: ================================================================================ +53: ============================= End of ROCm SMI Log ============================== +62: +62: +62: ======================= ROCm System Management Interface ======================= +62: ================================= Concise Info ================================= +62: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +62: 0 48.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 2 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 4 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 6 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 7 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: ================================================================================ +62: ============================= End of ROCm SMI Log ============================== +55: +55: +55: ======================= ROCm System Management Interface ======================= +55: ================================= Concise Info ================================= +55: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +55: 0 53.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 2 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 4 51.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 6 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: ================================================================================ +55: ============================= End of ROCm SMI Log ============================== +57: +57: +57: ======================= ROCm System Management Interface ======================= +57: ================================= Concise Info ================================= +57: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +57: 0 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 2 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 4 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 6 44.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: ================================================================================ +57: ============================= End of ROCm SMI Log ============================== +58: +58: +58: ======================= ROCm System Management Interface ======================= +58: ================================= Concise Info ================================= +58: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +58: 0 49.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 2 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 4 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: ================================================================================ +58: ============================= End of ROCm SMI Log ============================== +63: +63: +63: ======================= ROCm System Management Interface ======================= +63: ================================= Concise Info ================================= +63: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +63: 0 45.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 2 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 4 38.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: ================================================================================ +63: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 45.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 39.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +41: +41: +41: ======================= ROCm System Management Interface ======================= +41: ================================= Concise Info ================================= +41: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +41: 0 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 4 48.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: ================================================================================ +41: ============================= End of ROCm SMI Log ============================== +39: +39: +39: ======================= ROCm System Management Interface ======================= +39: ================================= Concise Info ================================= +39: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +39: 0 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 2 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 4 39.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 5 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 6 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: ================================================================================ +39: ============================= End of ROCm SMI Log ============================== +50: +50: +50: ======================= ROCm System Management Interface ======================= +50: ================================= Concise Info ================================= +50: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +50: 0 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 4 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 6 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: ================================================================================ +50: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 44.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== +44: +44: +44: ======================= ROCm System Management Interface ======================= +44: ================================= Concise Info ================================= +44: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +44: 0 52.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 2 36.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 6 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: ================================================================================ +44: ============================= End of ROCm SMI Log ============================== +45: +45: +45: ======================= ROCm System Management Interface ======================= +45: ================================= Concise Info ================================= +45: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +45: 0 47.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 2 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 4 44.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 6 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: ================================================================================ +45: ============================= End of ROCm SMI Log ============================== +48: +48: +48: ======================= ROCm System Management Interface ======================= +48: ================================= Concise Info ================================= +48: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +48: 0 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 2 44.0c 79.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 4 46.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 6 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: ================================================================================ +48: ============================= End of ROCm SMI Log ============================== +37: +37: +37: ======================= ROCm System Management Interface ======================= +37: ================================= Concise Info ================================= +37: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +37: 0 46.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 2 41.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 4 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 6 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: ================================================================================ +37: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 51.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 51.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 43.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 50.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 48.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 46.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 46.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 36.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 39.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 40.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 44.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 42.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 46.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 49.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 38.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 47.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 51.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 40.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 40.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== +59: +59: +59: ======================= ROCm System Management Interface ======================= +59: ================================= Concise Info ================================= +59: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +59: 0 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 2 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 4 41.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 6 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: ================================================================================ +59: ============================= End of ROCm SMI Log ============================== +60: +60: +60: ======================= ROCm System Management Interface ======================= +60: ================================= Concise Info ================================= +60: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +60: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 2 37.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 4 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 6 37.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: ================================================================================ +60: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 38.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 41.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== +34: +34: +34: ======================= ROCm System Management Interface ======================= +34: ================================= Concise Info ================================= +34: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +34: 0 47.0c 100.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 2 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 4 47.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 6 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: ================================================================================ +34: ============================= End of ROCm SMI Log ============================== +42: +42: +42: ======================= ROCm System Management Interface ======================= +42: ================================= Concise Info ================================= +42: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +42: 0 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 2 37.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 4 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 6 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: ================================================================================ +42: ============================= End of ROCm SMI Log ============================== +35: +35: +35: ======================= ROCm System Management Interface ======================= +35: ================================= Concise Info ================================= +35: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +35: 0 48.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 2 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 4 42.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: ================================================================================ +35: ============================= End of ROCm SMI Log ============================== +40: +40: +40: ======================= ROCm System Management Interface ======================= +40: ================================= Concise Info ================================= +40: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +40: 0 51.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 4 45.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 6 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: ================================================================================ +40: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 48.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 40.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 41.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 37.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +36: +36: +36: ======================= ROCm System Management Interface ======================= +36: ================================= Concise Info ================================= +36: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +36: 0 47.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 2 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 4 47.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 6 45.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: ================================================================================ +36: ============================= End of ROCm SMI Log ============================== +49: +49: +49: ======================= ROCm System Management Interface ======================= +49: ================================= Concise Info ================================= +49: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +49: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 2 45.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 4 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 6 38.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: ================================================================================ +49: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 47.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 38.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 49.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 44.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 39.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 47.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 44.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 38.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 48.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 41.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 46.0c 78.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 49.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 47.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 46.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 42.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 49.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 47.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 43.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +33: +33: +33: ======================= ROCm System Management Interface ======================= +33: ================================= Concise Info ================================= +33: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +33: 0 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 2 46.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 6 47.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: ================================================================================ +33: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 48.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 47.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 49.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 43.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 46.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +43: +43: +43: ======================= ROCm System Management Interface ======================= +43: ================================= Concise Info ================================= +43: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +43: 0 50.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 2 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 4 34.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 6 41.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: ================================================================================ +43: ============================= End of ROCm SMI Log ============================== +38: +38: +38: ======================= ROCm System Management Interface ======================= +38: ================================= Concise Info ================================= +38: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +38: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 2 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 4 43.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 6 42.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: ================================================================================ +38: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +51: +51: +51: ======================= ROCm System Management Interface ======================= +51: ================================= Concise Info ================================= +51: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +51: 0 50.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 2 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 4 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 6 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: ================================================================================ +51: ============================= End of ROCm SMI Log ============================== +61: +61: +61: ======================= ROCm System Management Interface ======================= +61: ================================= Concise Info ================================= +61: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +61: 0 49.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 2 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 4 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 6 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: ================================================================================ +61: ============================= End of ROCm SMI Log ============================== +46: +46: +46: ======================= ROCm System Management Interface ======================= +46: ================================= Concise Info ================================= +46: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +46: 0 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 2 44.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 4 50.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 6 37.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 7 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: ================================================================================ +46: ============================= End of ROCm SMI Log ============================== +56: +56: +56: ======================= ROCm System Management Interface ======================= +56: ================================= Concise Info ================================= +56: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +56: 0 46.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 2 39.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 4 46.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 6 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 7 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: ================================================================================ +56: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 46.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 42.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 49.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 44.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +32: +32: +32: ======================= ROCm System Management Interface ======================= +32: ================================= Concise Info ================================= +32: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +32: 0 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 2 44.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 4 36.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 6 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: ================================================================================ +32: ============================= End of ROCm SMI Log ============================== +54: +54: +54: ======================= ROCm System Management Interface ======================= +54: ================================= Concise Info ================================= +54: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +54: 0 47.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 2 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 4 41.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 6 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: ================================================================================ +54: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 46.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 45.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 47.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 47.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 37.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 43.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +47: +47: +47: ======================= ROCm System Management Interface ======================= +47: ================================= Concise Info ================================= +47: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +47: 0 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 2 40.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 6 38.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: ================================================================================ +47: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 37.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +53: Launching on nid007016 (53/64), master nid006726 port 9999, GPUs 8, CUDA: True +45: Launching on nid007008 (45/64), master nid006726 port 9999, GPUs 8, CUDA: True +35: Launching on nid006998 (35/64), master nid006726 port 9999, GPUs 8, CUDA: True +36: Launching on nid006999 (36/64), master nid006726 port 9999, GPUs 8, CUDA: True +14: Launching on nid006740 (14/64), master nid006726 port 9999, GPUs 8, CUDA: True +49: Launching on nid007012 (49/64), master nid006726 port 9999, GPUs 8, CUDA: True +31: Launching on nid006757 (31/64), master nid006726 port 9999, GPUs 8, CUDA: True +63: Launching on nid007026 (63/64), master nid006726 port 9999, GPUs 8, CUDA: True +13: Launching on nid006739 (13/64), master nid006726 port 9999, GPUs 8, CUDA: True +39: Launching on nid007002 (39/64), master nid006726 port 9999, GPUs 8, CUDA: True +42: Launching on nid007005 (42/64), master nid006726 port 9999, GPUs 8, CUDA: True +58: Launching on nid007021 (58/64), master nid006726 port 9999, GPUs 8, CUDA: True +27: Launching on nid006753 (27/64), master nid006726 port 9999, GPUs 8, CUDA: True +23: Launching on nid006749 (23/64), master nid006726 port 9999, GPUs 8, CUDA: True + 6: Launching on nid006732 (6/64), master nid006726 port 9999, GPUs 8, CUDA: True +40: Launching on nid007003 (40/64), master nid006726 port 9999, GPUs 8, CUDA: True +30: Launching on nid006756 (30/64), master nid006726 port 9999, GPUs 8, CUDA: True +33: Launching on nid006759 (33/64), master nid006726 port 9999, GPUs 8, CUDA: True + 2: Launching on nid006728 (2/64), master nid006726 port 9999, GPUs 8, CUDA: True +26: Launching on nid006752 (26/64), master nid006726 port 9999, GPUs 8, CUDA: True +55: Launching on nid007018 (55/64), master nid006726 port 9999, GPUs 8, CUDA: True +22: Launching on nid006748 (22/64), master nid006726 port 9999, GPUs 8, CUDA: True +43: Launching on nid007006 (43/64), master nid006726 port 9999, GPUs 8, CUDA: True + 0: Launching on nid006726 (0/64), master nid006726 port 9999, GPUs 8, CUDA: True +41: Launching on nid007004 (41/64), master nid006726 port 9999, GPUs 8, CUDA: True + 7: Launching on nid006733 (7/64), master nid006726 port 9999, GPUs 8, CUDA: True +15: Launching on nid006741 (15/64), master nid006726 port 9999, GPUs 8, CUDA: True +24: Launching on nid006750 (24/64), master nid006726 port 9999, GPUs 8, CUDA: True +60: Launching on nid007023 (60/64), master nid006726 port 9999, GPUs 8, CUDA: True +20: Launching on nid006746 (20/64), master nid006726 port 9999, GPUs 8, CUDA: True +19: Launching on nid006745 (19/64), master nid006726 port 9999, GPUs 8, CUDA: True +11: Launching on nid006737 (11/64), master nid006726 port 9999, GPUs 8, CUDA: True +57: Launching on nid007020 (57/64), master nid006726 port 9999, GPUs 8, CUDA: True +59: Launching on nid007022 (59/64), master nid006726 port 9999, GPUs 8, CUDA: True +18: Launching on nid006744 (18/64), master nid006726 port 9999, GPUs 8, CUDA: True +52: Launching on nid007015 (52/64), master nid006726 port 9999, GPUs 8, CUDA: True +28: Launching on nid006754 (28/64), master nid006726 port 9999, GPUs 8, CUDA: True +48: Launching on nid007011 (48/64), master nid006726 port 9999, GPUs 8, CUDA: True +37: Launching on nid007000 (37/64), master nid006726 port 9999, GPUs 8, CUDA: True +25: Launching on nid006751 (25/64), master nid006726 port 9999, GPUs 8, CUDA: True + 5: Launching on nid006731 (5/64), master nid006726 port 9999, GPUs 8, CUDA: True +34: Launching on nid006997 (34/64), master nid006726 port 9999, GPUs 8, CUDA: True +50: Launching on nid007013 (50/64), master nid006726 port 9999, GPUs 8, CUDA: True +62: Launching on nid007025 (62/64), master nid006726 port 9999, GPUs 8, CUDA: True + 1: Launching on nid006727 (1/64), master nid006726 port 9999, GPUs 8, CUDA: True + 4: Launching on nid006730 (4/64), master nid006726 port 9999, GPUs 8, CUDA: True + 3: Launching on nid006729 (3/64), master nid006726 port 9999, GPUs 8, CUDA: True +44: Launching on nid007007 (44/64), master nid006726 port 9999, GPUs 8, CUDA: True + 8: Launching on nid006734 (8/64), master nid006726 port 9999, GPUs 8, CUDA: True +16: Launching on nid006742 (16/64), master nid006726 port 9999, GPUs 8, CUDA: True +32: Launching on nid006758 (32/64), master nid006726 port 9999, GPUs 8, CUDA: True +61: Launching on nid007024 (61/64), master nid006726 port 9999, GPUs 8, CUDA: True +56: Launching on nid007019 (56/64), master nid006726 port 9999, GPUs 8, CUDA: True +54: Launching on nid007017 (54/64), master nid006726 port 9999, GPUs 8, CUDA: True +29: Launching on nid006755 (29/64), master nid006726 port 9999, GPUs 8, CUDA: True +21: Launching on nid006747 (21/64), master nid006726 port 9999, GPUs 8, CUDA: True +12: Launching on nid006738 (12/64), master nid006726 port 9999, GPUs 8, CUDA: True +17: Launching on nid006743 (17/64), master nid006726 port 9999, GPUs 8, CUDA: True +38: Launching on nid007001 (38/64), master nid006726 port 9999, GPUs 8, CUDA: True +10: Launching on nid006736 (10/64), master nid006726 port 9999, GPUs 8, CUDA: True + 9: Launching on nid006735 (9/64), master nid006726 port 9999, GPUs 8, CUDA: True +47: Launching on nid007010 (47/64), master nid006726 port 9999, GPUs 8, CUDA: True +51: Launching on nid007014 (51/64), master nid006726 port 9999, GPUs 8, CUDA: True +46: Launching on nid007009 (46/64), master nid006726 port 9999, GPUs 8, CUDA: True + 0: using world size: 512, data-parallel-size: 128, tensor-model-parallel size: 2, pipeline-model-parallel size: 2 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 128 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3430925.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 16384 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 512 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 4096 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-8b7178b44bval + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-8b7-178b-c4-repetitions/8b7178b44b + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 1 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 32 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 42 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 0 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 2 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-8b7-178b-c4-repetitions/8b7178b44b + 0: save_interval ................................... 5000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 2 + 0: tensorboard_dir ................................. tensorboard_8b7178b44bval + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 0 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 512 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 4 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 175 dummy tokens (new size: 50432) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-04-29 10:57:33,107] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl +63: > setting tensorboard ... + 0: > initializing tensor model parallel with size 2 + 0: > initializing pipeline model parallel with size 2 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.095 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 102 + 0: [1/1] c++ scaled_masked_softmax_hip.cuda.o scaled_masked_softmax_hip.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o scaled_masked_softmax_cuda.so + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: [1/1] c++ layer_norm_cuda.o layer_norm_hip_kernel.cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o fused_mix_prec_layer_norm_cuda.so + 0: >>> done with compiling and loading fused kernels. Compilation time: 37.880 seconds + 0: time to initialize megatron (seconds): 30.539 + 0: [after megatron is initialized] datetime: 2023-04-29 10:58:22 + 0: building GPT model ... + 0: [2023-04-29 10:58:22,708] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-04-29 10:58:22,709] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-04-29 10:58:22,709] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.44 GB, percent = 7.8% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=0, model=1): 1, ProcessCoord(pipe=0, data=1, model=0): 2, ProcessCoord(pipe=0, data=1, model=1): 3, ProcessCoord(pipe=0, data=2, model=0): 4, ProcessCoord(pipe=0, data=2, model=1): 5, ProcessCoord(pipe=0, data=3, model=0): 6, ProcessCoord(pipe=0, data=3, model=1): 7, ProcessCoord(pipe=0, data=4, model=0): 8, ProcessCoord(pipe=0, data=4, model=1): 9, ProcessCoord(pipe=0, data=5, model=0): 10, ProcessCoord(pipe=0, data=5, model=1): 11, ProcessCoord(pipe=0, data=6, model=0): 12, ProcessCoord(pipe=0, data=6, model=1): 13, ProcessCoord(pipe=0, data=7, model=0): 14, ProcessCoord(pipe=0, data=7, model=1): 15, ProcessCoord(pipe=0, data=8, model=0): 16, ProcessCoord(pipe=0, data=8, model=1): 17, ProcessCoord(pipe=0, data=9, model=0): 18, ProcessCoord(pipe=0, data=9, model=1): 19, ProcessCoord(pipe=0, data=10, model=0): 20, ProcessCoord(pipe=0, data=10, model=1): 21, ProcessCoord(pipe=0, data=11, model=0): 22, ProcessCoord(pipe=0, data + 0: =11, model=1): 23, ProcessCoord(pipe=0, data=12, model=0): 24, ProcessCoord(pipe=0, data=12, model=1): 25, ProcessCoord(pipe=0, data=13, model=0): 26, ProcessCoord(pipe=0, data=13, model=1): 27, ProcessCoord(pipe=0, data=14, model=0): 28, ProcessCoord(pipe=0, data=14, model=1): 29, ProcessCoord(pipe=0, data=15, model=0): 30, ProcessCoord(pipe=0, data=15, model=1): 31, ProcessCoord(pipe=0, data=16, model=0): 32, ProcessCoord(pipe=0, data=16, model=1): 33, ProcessCoord(pipe=0, data=17, model=0): 34, ProcessCoord(pipe=0, data=17, model=1): 35, ProcessCoord(pipe=0, data=18, model=0): 36, ProcessCoord(pipe=0, data=18, model=1): 37, ProcessCoord(pipe=0, data=19, model=0): 38, ProcessCoord(pipe=0, data=19, model=1): 39, ProcessCoord(pipe=0, data=20, model=0): 40, ProcessCoord(pipe=0, data=20, model=1): 41, ProcessCoord(pipe=0, data=21, model=0): 42, ProcessCoord(pipe=0, data=21, model=1): 43, ProcessCoord(pipe=0, data=22, model=0): 44, ProcessCoord(pipe=0, data=22, model=1): 45, ProcessCoord(pipe=0, data=23, model=0 + 0: ): 46, ProcessCoord(pipe=0, data=23, model=1): 47, ProcessCoord(pipe=0, data=24, model=0): 48, ProcessCoord(pipe=0, data=24, model=1): 49, ProcessCoord(pipe=0, data=25, model=0): 50, ProcessCoord(pipe=0, data=25, model=1): 51, ProcessCoord(pipe=0, data=26, model=0): 52, ProcessCoord(pipe=0, data=26, model=1): 53, ProcessCoord(pipe=0, data=27, model=0): 54, ProcessCoord(pipe=0, data=27, model=1): 55, ProcessCoord(pipe=0, data=28, model=0): 56, ProcessCoord(pipe=0, data=28, model=1): 57, ProcessCoord(pipe=0, data=29, model=0): 58, ProcessCoord(pipe=0, data=29, model=1): 59, ProcessCoord(pipe=0, data=30, model=0): 60, ProcessCoord(pipe=0, data=30, model=1): 61, ProcessCoord(pipe=0, data=31, model=0): 62, ProcessCoord(pipe=0, data=31, model=1): 63, ProcessCoord(pipe=0, data=32, model=0): 64, ProcessCoord(pipe=0, data=32, model=1): 65, ProcessCoord(pipe=0, data=33, model=0): 66, ProcessCoord(pipe=0, data=33, model=1): 67, ProcessCoord(pipe=0, data=34, model=0): 68, ProcessCoord(pipe=0, data=34, model=1): 69, Proce + 0: ssCoord(pipe=0, data=35, model=0): 70, ProcessCoord(pipe=0, data=35, model=1): 71, ProcessCoord(pipe=0, data=36, model=0): 72, ProcessCoord(pipe=0, data=36, model=1): 73, ProcessCoord(pipe=0, data=37, model=0): 74, ProcessCoord(pipe=0, data=37, model=1): 75, ProcessCoord(pipe=0, data=38, model=0): 76, ProcessCoord(pipe=0, data=38, model=1): 77, ProcessCoord(pipe=0, data=39, model=0): 78, ProcessCoord(pipe=0, data=39, model=1): 79, ProcessCoord(pipe=0, data=40, model=0): 80, ProcessCoord(pipe=0, data=40, model=1): 81, ProcessCoord(pipe=0, data=41, model=0): 82, ProcessCoord(pipe=0, data=41, model=1): 83, ProcessCoord(pipe=0, data=42, model=0): 84, ProcessCoord(pipe=0, data=42, model=1): 85, ProcessCoord(pipe=0, data=43, model=0): 86, ProcessCoord(pipe=0, data=43, model=1): 87, ProcessCoord(pipe=0, data=44, model=0): 88, ProcessCoord(pipe=0, data=44, model=1): 89, ProcessCoord(pipe=0, data=45, model=0): 90, ProcessCoord(pipe=0, data=45, model=1): 91, ProcessCoord(pipe=0, data=46, model=0): 92, ProcessCoord(pipe + 0: =0, data=46, model=1): 93, ProcessCoord(pipe=0, data=47, model=0): 94, ProcessCoord(pipe=0, data=47, model=1): 95, ProcessCoord(pipe=0, data=48, model=0): 96, ProcessCoord(pipe=0, data=48, model=1): 97, ProcessCoord(pipe=0, data=49, model=0): 98, ProcessCoord(pipe=0, data=49, model=1): 99, ProcessCoord(pipe=0, data=50, model=0): 100, ProcessCoord(pipe=0, data=50, model=1): 101, ProcessCoord(pipe=0, data=51, model=0): 102, ProcessCoord(pipe=0, data=51, model=1): 103, ProcessCoord(pipe=0, data=52, model=0): 104, ProcessCoord(pipe=0, data=52, model=1): 105, ProcessCoord(pipe=0, data=53, model=0): 106, ProcessCoord(pipe=0, data=53, model=1): 107, ProcessCoord(pipe=0, data=54, model=0): 108, ProcessCoord(pipe=0, data=54, model=1): 109, ProcessCoord(pipe=0, data=55, model=0): 110, ProcessCoord(pipe=0, data=55, model=1): 111, ProcessCoord(pipe=0, data=56, model=0): 112, ProcessCoord(pipe=0, data=56, model=1): 113, ProcessCoord(pipe=0, data=57, model=0): 114, ProcessCoord(pipe=0, data=57, model=1): 115, ProcessCoord( + 0: pipe=0, data=58, model=0): 116, ProcessCoord(pipe=0, data=58, model=1): 117, ProcessCoord(pipe=0, data=59, model=0): 118, ProcessCoord(pipe=0, data=59, model=1): 119, ProcessCoord(pipe=0, data=60, model=0): 120, ProcessCoord(pipe=0, data=60, model=1): 121, ProcessCoord(pipe=0, data=61, model=0): 122, ProcessCoord(pipe=0, data=61, model=1): 123, ProcessCoord(pipe=0, data=62, model=0): 124, ProcessCoord(pipe=0, data=62, model=1): 125, ProcessCoord(pipe=0, data=63, model=0): 126, ProcessCoord(pipe=0, data=63, model=1): 127, ProcessCoord(pipe=0, data=64, model=0): 128, ProcessCoord(pipe=0, data=64, model=1): 129, ProcessCoord(pipe=0, data=65, model=0): 130, ProcessCoord(pipe=0, data=65, model=1): 131, ProcessCoord(pipe=0, data=66, model=0): 132, ProcessCoord(pipe=0, data=66, model=1): 133, ProcessCoord(pipe=0, data=67, model=0): 134, ProcessCoord(pipe=0, data=67, model=1): 135, ProcessCoord(pipe=0, data=68, model=0): 136, ProcessCoord(pipe=0, data=68, model=1): 137, ProcessCoord(pipe=0, data=69, model=0): 138, Pr + 0: ocessCoord(pipe=0, data=69, model=1): 139, ProcessCoord(pipe=0, data=70, model=0): 140, ProcessCoord(pipe=0, data=70, model=1): 141, ProcessCoord(pipe=0, data=71, model=0): 142, ProcessCoord(pipe=0, data=71, model=1): 143, ProcessCoord(pipe=0, data=72, model=0): 144, ProcessCoord(pipe=0, data=72, model=1): 145, ProcessCoord(pipe=0, data=73, model=0): 146, ProcessCoord(pipe=0, data=73, model=1): 147, ProcessCoord(pipe=0, data=74, model=0): 148, ProcessCoord(pipe=0, data=74, model=1): 149, ProcessCoord(pipe=0, data=75, model=0): 150, ProcessCoord(pipe=0, data=75, model=1): 151, ProcessCoord(pipe=0, data=76, model=0): 152, ProcessCoord(pipe=0, data=76, model=1): 153, ProcessCoord(pipe=0, data=77, model=0): 154, ProcessCoord(pipe=0, data=77, model=1): 155, ProcessCoord(pipe=0, data=78, model=0): 156, ProcessCoord(pipe=0, data=78, model=1): 157, ProcessCoord(pipe=0, data=79, model=0): 158, ProcessCoord(pipe=0, data=79, model=1): 159, ProcessCoord(pipe=0, data=80, model=0): 160, ProcessCoord(pipe=0, data=80, model= + 0: 1): 161, ProcessCoord(pipe=0, data=81, model=0): 162, ProcessCoord(pipe=0, data=81, model=1): 163, ProcessCoord(pipe=0, data=82, model=0): 164, ProcessCoord(pipe=0, data=82, model=1): 165, ProcessCoord(pipe=0, data=83, model=0): 166, ProcessCoord(pipe=0, data=83, model=1): 167, ProcessCoord(pipe=0, data=84, model=0): 168, ProcessCoord(pipe=0, data=84, model=1): 169, ProcessCoord(pipe=0, data=85, model=0): 170, ProcessCoord(pipe=0, data=85, model=1): 171, ProcessCoord(pipe=0, data=86, model=0): 172, ProcessCoord(pipe=0, data=86, model=1): 173, ProcessCoord(pipe=0, data=87, model=0): 174, ProcessCoord(pipe=0, data=87, model=1): 175, ProcessCoord(pipe=0, data=88, model=0): 176, ProcessCoord(pipe=0, data=88, model=1): 177, ProcessCoord(pipe=0, data=89, model=0): 178, ProcessCoord(pipe=0, data=89, model=1): 179, ProcessCoord(pipe=0, data=90, model=0): 180, ProcessCoord(pipe=0, data=90, model=1): 181, ProcessCoord(pipe=0, data=91, model=0): 182, ProcessCoord(pipe=0, data=91, model=1): 183, ProcessCoord(pipe=0, data + 0: =92, model=0): 184, ProcessCoord(pipe=0, data=92, model=1): 185, ProcessCoord(pipe=0, data=93, model=0): 186, ProcessCoord(pipe=0, data=93, model=1): 187, ProcessCoord(pipe=0, data=94, model=0): 188, ProcessCoord(pipe=0, data=94, model=1): 189, ProcessCoord(pipe=0, data=95, model=0): 190, ProcessCoord(pipe=0, data=95, model=1): 191, ProcessCoord(pipe=0, data=96, model=0): 192, ProcessCoord(pipe=0, data=96, model=1): 193, ProcessCoord(pipe=0, data=97, model=0): 194, ProcessCoord(pipe=0, data=97, model=1): 195, ProcessCoord(pipe=0, data=98, model=0): 196, ProcessCoord(pipe=0, data=98, model=1): 197, ProcessCoord(pipe=0, data=99, model=0): 198, ProcessCoord(pipe=0, data=99, model=1): 199, ProcessCoord(pipe=0, data=100, model=0): 200, ProcessCoord(pipe=0, data=100, model=1): 201, ProcessCoord(pipe=0, data=101, model=0): 202, ProcessCoord(pipe=0, data=101, model=1): 203, ProcessCoord(pipe=0, data=102, model=0): 204, ProcessCoord(pipe=0, data=102, model=1): 205, ProcessCoord(pipe=0, data=103, model=0): 206, Process + 0: Coord(pipe=0, data=103, model=1): 207, ProcessCoord(pipe=0, data=104, model=0): 208, ProcessCoord(pipe=0, data=104, model=1): 209, ProcessCoord(pipe=0, data=105, model=0): 210, ProcessCoord(pipe=0, data=105, model=1): 211, ProcessCoord(pipe=0, data=106, model=0): 212, ProcessCoord(pipe=0, data=106, model=1): 213, ProcessCoord(pipe=0, data=107, model=0): 214, ProcessCoord(pipe=0, data=107, model=1): 215, ProcessCoord(pipe=0, data=108, model=0): 216, ProcessCoord(pipe=0, data=108, model=1): 217, ProcessCoord(pipe=0, data=109, model=0): 218, ProcessCoord(pipe=0, data=109, model=1): 219, ProcessCoord(pipe=0, data=110, model=0): 220, ProcessCoord(pipe=0, data=110, model=1): 221, ProcessCoord(pipe=0, data=111, model=0): 222, ProcessCoord(pipe=0, data=111, model=1): 223, ProcessCoord(pipe=0, data=112, model=0): 224, ProcessCoord(pipe=0, data=112, model=1): 225, ProcessCoord(pipe=0, data=113, model=0): 226, ProcessCoord(pipe=0, data=113, model=1): 227, ProcessCoord(pipe=0, data=114, model=0): 228, ProcessCoord(pipe=0 + 0: , data=114, model=1): 229, ProcessCoord(pipe=0, data=115, model=0): 230, ProcessCoord(pipe=0, data=115, model=1): 231, ProcessCoord(pipe=0, data=116, model=0): 232, ProcessCoord(pipe=0, data=116, model=1): 233, ProcessCoord(pipe=0, data=117, model=0): 234, ProcessCoord(pipe=0, data=117, model=1): 235, ProcessCoord(pipe=0, data=118, model=0): 236, ProcessCoord(pipe=0, data=118, model=1): 237, ProcessCoord(pipe=0, data=119, model=0): 238, ProcessCoord(pipe=0, data=119, model=1): 239, ProcessCoord(pipe=0, data=120, model=0): 240, ProcessCoord(pipe=0, data=120, model=1): 241, ProcessCoord(pipe=0, data=121, model=0): 242, ProcessCoord(pipe=0, data=121, model=1): 243, ProcessCoord(pipe=0, data=122, model=0): 244, ProcessCoord(pipe=0, data=122, model=1): 245, ProcessCoord(pipe=0, data=123, model=0): 246, ProcessCoord(pipe=0, data=123, model=1): 247, ProcessCoord(pipe=0, data=124, model=0): 248, ProcessCoord(pipe=0, data=124, model=1): 249, ProcessCoord(pipe=0, data=125, model=0): 250, ProcessCoord(pipe=0, data=125, + 0: model=1): 251, ProcessCoord(pipe=0, data=126, model=0): 252, ProcessCoord(pipe=0, data=126, model=1): 253, ProcessCoord(pipe=0, data=127, model=0): 254, ProcessCoord(pipe=0, data=127, model=1): 255, ProcessCoord(pipe=1, data=0, model=0): 256, ProcessCoord(pipe=1, data=0, model=1): 257, ProcessCoord(pipe=1, data=1, model=0): 258, ProcessCoord(pipe=1, data=1, model=1): 259, ProcessCoord(pipe=1, data=2, model=0): 260, ProcessCoord(pipe=1, data=2, model=1): 261, ProcessCoord(pipe=1, data=3, model=0): 262, ProcessCoord(pipe=1, data=3, model=1): 263, ProcessCoord(pipe=1, data=4, model=0): 264, ProcessCoord(pipe=1, data=4, model=1): 265, ProcessCoord(pipe=1, data=5, model=0): 266, ProcessCoord(pipe=1, data=5, model=1): 267, ProcessCoord(pipe=1, data=6, model=0): 268, ProcessCoord(pipe=1, data=6, model=1): 269, ProcessCoord(pipe=1, data=7, model=0): 270, ProcessCoord(pipe=1, data=7, model=1): 271, ProcessCoord(pipe=1, data=8, model=0): 272, ProcessCoord(pipe=1, data=8, model=1): 273, ProcessCoord(pipe=1, data=9, mode + 0: l=0): 274, ProcessCoord(pipe=1, data=9, model=1): 275, ProcessCoord(pipe=1, data=10, model=0): 276, ProcessCoord(pipe=1, data=10, model=1): 277, ProcessCoord(pipe=1, data=11, model=0): 278, ProcessCoord(pipe=1, data=11, model=1): 279, ProcessCoord(pipe=1, data=12, model=0): 280, ProcessCoord(pipe=1, data=12, model=1): 281, ProcessCoord(pipe=1, data=13, model=0): 282, ProcessCoord(pipe=1, data=13, model=1): 283, ProcessCoord(pipe=1, data=14, model=0): 284, ProcessCoord(pipe=1, data=14, model=1): 285, ProcessCoord(pipe=1, data=15, model=0): 286, ProcessCoord(pipe=1, data=15, model=1): 287, ProcessCoord(pipe=1, data=16, model=0): 288, ProcessCoord(pipe=1, data=16, model=1): 289, ProcessCoord(pipe=1, data=17, model=0): 290, ProcessCoord(pipe=1, data=17, model=1): 291, ProcessCoord(pipe=1, data=18, model=0): 292, ProcessCoord(pipe=1, data=18, model=1): 293, ProcessCoord(pipe=1, data=19, model=0): 294, ProcessCoord(pipe=1, data=19, model=1): 295, ProcessCoord(pipe=1, data=20, model=0): 296, ProcessCoord(pipe=1, dat + 0: a=20, model=1): 297, ProcessCoord(pipe=1, data=21, model=0): 298, ProcessCoord(pipe=1, data=21, model=1): 299, ProcessCoord(pipe=1, data=22, model=0): 300, ProcessCoord(pipe=1, data=22, model=1): 301, ProcessCoord(pipe=1, data=23, model=0): 302, ProcessCoord(pipe=1, data=23, model=1): 303, ProcessCoord(pipe=1, data=24, model=0): 304, ProcessCoord(pipe=1, data=24, model=1): 305, ProcessCoord(pipe=1, data=25, model=0): 306, ProcessCoord(pipe=1, data=25, model=1): 307, ProcessCoord(pipe=1, data=26, model=0): 308, ProcessCoord(pipe=1, data=26, model=1): 309, ProcessCoord(pipe=1, data=27, model=0): 310, ProcessCoord(pipe=1, data=27, model=1): 311, ProcessCoord(pipe=1, data=28, model=0): 312, ProcessCoord(pipe=1, data=28, model=1): 313, ProcessCoord(pipe=1, data=29, model=0): 314, ProcessCoord(pipe=1, data=29, model=1): 315, ProcessCoord(pipe=1, data=30, model=0): 316, ProcessCoord(pipe=1, data=30, model=1): 317, ProcessCoord(pipe=1, data=31, model=0): 318, ProcessCoord(pipe=1, data=31, model=1): 319, ProcessCoord( + 0: pipe=1, data=32, model=0): 320, ProcessCoord(pipe=1, data=32, model=1): 321, ProcessCoord(pipe=1, data=33, model=0): 322, ProcessCoord(pipe=1, data=33, model=1): 323, ProcessCoord(pipe=1, data=34, model=0): 324, ProcessCoord(pipe=1, data=34, model=1): 325, ProcessCoord(pipe=1, data=35, model=0): 326, ProcessCoord(pipe=1, data=35, model=1): 327, ProcessCoord(pipe=1, data=36, model=0): 328, ProcessCoord(pipe=1, data=36, model=1): 329, ProcessCoord(pipe=1, data=37, model=0): 330, ProcessCoord(pipe=1, data=37, model=1): 331, ProcessCoord(pipe=1, data=38, model=0): 332, ProcessCoord(pipe=1, data=38, model=1): 333, ProcessCoord(pipe=1, data=39, model=0): 334, ProcessCoord(pipe=1, data=39, model=1): 335, ProcessCoord(pipe=1, data=40, model=0): 336, ProcessCoord(pipe=1, data=40, model=1): 337, ProcessCoord(pipe=1, data=41, model=0): 338, ProcessCoord(pipe=1, data=41, model=1): 339, ProcessCoord(pipe=1, data=42, model=0): 340, ProcessCoord(pipe=1, data=42, model=1): 341, ProcessCoord(pipe=1, data=43, model=0): 342, Pr + 0: ocessCoord(pipe=1, data=43, model=1): 343, ProcessCoord(pipe=1, data=44, model=0): 344, ProcessCoord(pipe=1, data=44, model=1): 345, ProcessCoord(pipe=1, data=45, model=0): 346, ProcessCoord(pipe=1, data=45, model=1): 347, ProcessCoord(pipe=1, data=46, model=0): 348, ProcessCoord(pipe=1, data=46, model=1): 349, ProcessCoord(pipe=1, data=47, model=0): 350, ProcessCoord(pipe=1, data=47, model=1): 351, ProcessCoord(pipe=1, data=48, model=0): 352, ProcessCoord(pipe=1, data=48, model=1): 353, ProcessCoord(pipe=1, data=49, model=0): 354, ProcessCoord(pipe=1, data=49, model=1): 355, ProcessCoord(pipe=1, data=50, model=0): 356, ProcessCoord(pipe=1, data=50, model=1): 357, ProcessCoord(pipe=1, data=51, model=0): 358, ProcessCoord(pipe=1, data=51, model=1): 359, ProcessCoord(pipe=1, data=52, model=0): 360, ProcessCoord(pipe=1, data=52, model=1): 361, ProcessCoord(pipe=1, data=53, model=0): 362, ProcessCoord(pipe=1, data=53, model=1): 363, ProcessCoord(pipe=1, data=54, model=0): 364, ProcessCoord(pipe=1, data=54, model= + 0: 1): 365, ProcessCoord(pipe=1, data=55, model=0): 366, ProcessCoord(pipe=1, data=55, model=1): 367, ProcessCoord(pipe=1, data=56, model=0): 368, ProcessCoord(pipe=1, data=56, model=1): 369, ProcessCoord(pipe=1, data=57, model=0): 370, ProcessCoord(pipe=1, data=57, model=1): 371, ProcessCoord(pipe=1, data=58, model=0): 372, ProcessCoord(pipe=1, data=58, model=1): 373, ProcessCoord(pipe=1, data=59, model=0): 374, ProcessCoord(pipe=1, data=59, model=1): 375, ProcessCoord(pipe=1, data=60, model=0): 376, ProcessCoord(pipe=1, data=60, model=1): 377, ProcessCoord(pipe=1, data=61, model=0): 378, ProcessCoord(pipe=1, data=61, model=1): 379, ProcessCoord(pipe=1, data=62, model=0): 380, ProcessCoord(pipe=1, data=62, model=1): 381, ProcessCoord(pipe=1, data=63, model=0): 382, ProcessCoord(pipe=1, data=63, model=1): 383, ProcessCoord(pipe=1, data=64, model=0): 384, ProcessCoord(pipe=1, data=64, model=1): 385, ProcessCoord(pipe=1, data=65, model=0): 386, ProcessCoord(pipe=1, data=65, model=1): 387, ProcessCoord(pipe=1, data + 0: =66, model=0): 388, ProcessCoord(pipe=1, data=66, model=1): 389, ProcessCoord(pipe=1, data=67, model=0): 390, ProcessCoord(pipe=1, data=67, model=1): 391, ProcessCoord(pipe=1, data=68, model=0): 392, ProcessCoord(pipe=1, data=68, model=1): 393, ProcessCoord(pipe=1, data=69, model=0): 394, ProcessCoord(pipe=1, data=69, model=1): 395, ProcessCoord(pipe=1, data=70, model=0): 396, ProcessCoord(pipe=1, data=70, model=1): 397, ProcessCoord(pipe=1, data=71, model=0): 398, ProcessCoord(pipe=1, data=71, model=1): 399, ProcessCoord(pipe=1, data=72, model=0): 400, ProcessCoord(pipe=1, data=72, model=1): 401, ProcessCoord(pipe=1, data=73, model=0): 402, ProcessCoord(pipe=1, data=73, model=1): 403, ProcessCoord(pipe=1, data=74, model=0): 404, ProcessCoord(pipe=1, data=74, model=1): 405, ProcessCoord(pipe=1, data=75, model=0): 406, ProcessCoord(pipe=1, data=75, model=1): 407, ProcessCoord(pipe=1, data=76, model=0): 408, ProcessCoord(pipe=1, data=76, model=1): 409, ProcessCoord(pipe=1, data=77, model=0): 410, ProcessCoord(p + 0: ipe=1, data=77, model=1): 411, ProcessCoord(pipe=1, data=78, model=0): 412, ProcessCoord(pipe=1, data=78, model=1): 413, ProcessCoord(pipe=1, data=79, model=0): 414, ProcessCoord(pipe=1, data=79, model=1): 415, ProcessCoord(pipe=1, data=80, model=0): 416, ProcessCoord(pipe=1, data=80, model=1): 417, ProcessCoord(pipe=1, data=81, model=0): 418, ProcessCoord(pipe=1, data=81, model=1): 419, ProcessCoord(pipe=1, data=82, model=0): 420, ProcessCoord(pipe=1, data=82, model=1): 421, ProcessCoord(pipe=1, data=83, model=0): 422, ProcessCoord(pipe=1, data=83, model=1): 423, ProcessCoord(pipe=1, data=84, model=0): 424, ProcessCoord(pipe=1, data=84, model=1): 425, ProcessCoord(pipe=1, data=85, model=0): 426, ProcessCoord(pipe=1, data=85, model=1): 427, ProcessCoord(pipe=1, data=86, model=0): 428, ProcessCoord(pipe=1, data=86, model=1): 429, ProcessCoord(pipe=1, data=87, model=0): 430, ProcessCoord(pipe=1, data=87, model=1): 431, ProcessCoord(pipe=1, data=88, model=0): 432, ProcessCoord(pipe=1, data=88, model=1): 433, Pro + 0: cessCoord(pipe=1, data=89, model=0): 434, ProcessCoord(pipe=1, data=89, model=1): 435, ProcessCoord(pipe=1, data=90, model=0): 436, ProcessCoord(pipe=1, data=90, model=1): 437, ProcessCoord(pipe=1, data=91, model=0): 438, ProcessCoord(pipe=1, data=91, model=1): 439, ProcessCoord(pipe=1, data=92, model=0): 440, ProcessCoord(pipe=1, data=92, model=1): 441, ProcessCoord(pipe=1, data=93, model=0): 442, ProcessCoord(pipe=1, data=93, model=1): 443, ProcessCoord(pipe=1, data=94, model=0): 444, ProcessCoord(pipe=1, data=94, model=1): 445, ProcessCoord(pipe=1, data=95, model=0): 446, ProcessCoord(pipe=1, data=95, model=1): 447, ProcessCoord(pipe=1, data=96, model=0): 448, ProcessCoord(pipe=1, data=96, model=1): 449, ProcessCoord(pipe=1, data=97, model=0): 450, ProcessCoord(pipe=1, data=97, model=1): 451, ProcessCoord(pipe=1, data=98, model=0): 452, ProcessCoord(pipe=1, data=98, model=1): 453, ProcessCoord(pipe=1, data=99, model=0): 454, ProcessCoord(pipe=1, data=99, model=1): 455, ProcessCoord(pipe=1, data=100, model= + 0: 0): 456, ProcessCoord(pipe=1, data=100, model=1): 457, ProcessCoord(pipe=1, data=101, model=0): 458, ProcessCoord(pipe=1, data=101, model=1): 459, ProcessCoord(pipe=1, data=102, model=0): 460, ProcessCoord(pipe=1, data=102, model=1): 461, ProcessCoord(pipe=1, data=103, model=0): 462, ProcessCoord(pipe=1, data=103, model=1): 463, ProcessCoord(pipe=1, data=104, model=0): 464, ProcessCoord(pipe=1, data=104, model=1): 465, ProcessCoord(pipe=1, data=105, model=0): 466, ProcessCoord(pipe=1, data=105, model=1): 467, ProcessCoord(pipe=1, data=106, model=0): 468, ProcessCoord(pipe=1, data=106, model=1): 469, ProcessCoord(pipe=1, data=107, model=0): 470, ProcessCoord(pipe=1, data=107, model=1): 471, ProcessCoord(pipe=1, data=108, model=0): 472, ProcessCoord(pipe=1, data=108, model=1): 473, ProcessCoord(pipe=1, data=109, model=0): 474, ProcessCoord(pipe=1, data=109, model=1): 475, ProcessCoord(pipe=1, data=110, model=0): 476, ProcessCoord(pipe=1, data=110, model=1): 477, ProcessCoord(pipe=1, data=111, model=0): 478, Pro + 0: cessCoord(pipe=1, data=111, model=1): 479, ProcessCoord(pipe=1, data=112, model=0): 480, ProcessCoord(pipe=1, data=112, model=1): 481, ProcessCoord(pipe=1, data=113, model=0): 482, ProcessCoord(pipe=1, data=113, model=1): 483, ProcessCoord(pipe=1, data=114, model=0): 484, ProcessCoord(pipe=1, data=114, model=1): 485, ProcessCoord(pipe=1, data=115, model=0): 486, ProcessCoord(pipe=1, data=115, model=1): 487, ProcessCoord(pipe=1, data=116, model=0): 488, ProcessCoord(pipe=1, data=116, model=1): 489, ProcessCoord(pipe=1, data=117, model=0): 490, ProcessCoord(pipe=1, data=117, model=1): 491, ProcessCoord(pipe=1, data=118, model=0): 492, ProcessCoord(pipe=1, data=118, model=1): 493, ProcessCoord(pipe=1, data=119, model=0): 494, ProcessCoord(pipe=1, data=119, model=1): 495, ProcessCoord(pipe=1, data=120, model=0): 496, ProcessCoord(pipe=1, data=120, model=1): 497, ProcessCoord(pipe=1, data=121, model=0): 498, ProcessCoord(pipe=1, data=121, model=1): 499, ProcessCoord(pipe=1, data=122, model=0): 500, ProcessCoord(pi + 0: pe=1, data=122, model=1): 501, ProcessCoord(pipe=1, data=123, model=0): 502, ProcessCoord(pipe=1, data=123, model=1): 503, ProcessCoord(pipe=1, data=124, model=0): 504, ProcessCoord(pipe=1, data=124, model=1): 505, ProcessCoord(pipe=1, data=125, model=0): 506, ProcessCoord(pipe=1, data=125, model=1): 507, ProcessCoord(pipe=1, data=126, model=0): 508, ProcessCoord(pipe=1, data=126, model=1): 509, ProcessCoord(pipe=1, data=127, model=0): 510, ProcessCoord(pipe=1, data=127, model=1): 511} + 0: [2023-04-29 10:58:30,313] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=24 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: stage=1 layers=25 + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: ParallelTransformerLayerPipe + 0: 38: ParallelTransformerLayerPipe + 0: 39: ParallelTransformerLayerPipe + 0: 40: ParallelTransformerLayerPipe + 0: 41: ParallelTransformerLayerPipe + 0: 42: ParallelTransformerLayerPipe + 0: 43: ParallelTransformerLayerPipe + 0: 44: ParallelTransformerLayerPipe + 0: 45: undo + 0: 46: MixedFusedLayerNorm + 0: 47: EmbeddingPipe + 0: 48: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-04-29 10:58:33,933] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-04-29 10:58:33,934] [INFO] [utils.py:828:see_memory_usage] MA 4.16 GB Max_MA 4.16 GB CA 4.17 GB Max_CA 4 GB + 0: [2023-04-29 10:58:33,934] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.3 GB, percent = 8.0% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-04-29 10:58:33,936] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-04-29 10:58:38,436] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-04-29 10:58:38,436] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-04-29 10:58:38,436] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-04-29 10:58:38,445] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-04-29 10:58:38,445] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-04-29 10:58:38,571] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-04-29 10:58:38,571] [INFO] [utils.py:828:see_memory_usage] MA 4.15 GB Max_MA 4.18 GB CA 4.18 GB Max_CA 4 GB + 0: [2023-04-29 10:58:38,572] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.94 GB, percent = 8.1% +23: Time to load utils op: 0.3386049270629883 secondsTime to load utils op: 0.33878493309020996 secondsTime to load utils op: 0.3387587070465088 seconds +23: +23: +23: Time to load utils op: 0.33876705169677734 seconds +22: Time to load utils op: 0.33524227142333984 seconds +22: Time to load utils op: 0.33525729179382324 seconds +22: Time to load utils op: 0.3352646827697754 seconds +22: Time to load utils op: 0.33527159690856934 seconds +24: Time to load utils op: 0.33569765090942383 seconds +24: Time to load utils op: 0.33569884300231934 seconds +24: Time to load utils op: 0.3357064723968506 seconds +24: Time to load utils op: 0.3357081413269043 seconds +14: Time to load utils op: 0.33652424812316895 secondsTime to load utils op: 0.33652377128601074 seconds +14: +14: Time to load utils op: 0.33653807640075684 seconds +14: Time to load utils op: 0.3365452289581299 seconds +29: Time to load utils op: 0.33458447456359863 secondsTime to load utils op: 0.33458566665649414 seconds +29: +29: Time to load utils op: 0.3346071243286133 seconds +29: Time to load utils op: 0.33463096618652344 seconds +17: Time to load utils op: 0.33716726303100586 secondsTime to load utils op: 0.3371732234954834 secondsTime to load utils op: 0.3371725082397461 seconds +17: +17: +17: Time to load utils op: 0.33718085289001465 seconds +26: Time to load utils op: 0.33652710914611816 seconds +26: Time to load utils op: 0.3365497589111328 secondsTime to load utils op: 0.3365511894226074 seconds +26: +26: Time to load utils op: 0.3365662097930908 seconds +30: Time to load utils op: 0.3350377082824707 secondsTime to load utils op: 0.3350346088409424 seconds +30: +30: Time to load utils op: 0.3350539207458496 secondsTime to load utils op: 0.33506107330322266 seconds +30: +27: Time to load utils op: 0.3374345302581787 seconds +27: Time to load utils op: 0.3374602794647217 seconds +27: Time to load utils op: 0.3374648094177246 seconds +27: Time to load utils op: 0.3374752998352051 seconds +28: Time to load utils op: 0.33722567558288574 seconds +28: Time to load utils op: 0.3372323513031006 seconds +28: Time to load utils op: 0.33722901344299316 seconds +28: Time to load utils op: 0.3372533321380615 seconds +19: Time to load utils op: 0.3399620056152344 secondsTime to load utils op: 0.3399674892425537 seconds +19: Time to load utils op: 0.33995676040649414 seconds +19: +19: Time to load utils op: 0.3399679660797119 seconds + 0: Time to load utils op: 0.20751070976257324 secondsTime to load utils op: 0.20760393142700195 secondsTime to load utils op: 0.20750689506530762 secondsTime to load utils op: 0.1166386604309082 seconds + 0: + 0: + 0: +16: Time to load utils op: 0.3410625457763672 seconds +16: Time to load utils op: 0.34105896949768066 seconds +16: Time to load utils op: 0.34106993675231934 seconds +15: Time to load utils op: 0.3411529064178467 seconds +16: Time to load utils op: 0.3410964012145996 seconds +15: Time to load utils op: 0.3411545753479004 secondsTime to load utils op: 0.34116268157958984 seconds +15: +15: Time to load utils op: 0.3411898612976074 seconds +31: Time to load utils op: 0.33757996559143066 secondsTime to load utils op: 0.33757996559143066 seconds +31: +31: Time to load utils op: 0.337601900100708 seconds +31: Time to load utils op: 0.33761024475097656 seconds +25: Time to load utils op: 0.34186244010925293 secondsTime to load utils op: 0.3418614864349365 seconds +25: +25: Time to load utils op: 0.3418750762939453 seconds +25: Time to load utils op: 0.34189534187316895 seconds +18: Time to load utils op: 0.34240150451660156 seconds +18: Time to load utils op: 0.34242701530456543 seconds +18: Time to load utils op: 0.3423891067504883 seconds +18: Time to load utils op: 0.3424341678619385 seconds + 4: Time to load utils op: 0.20918941497802734 secondsTime to load utils op: 0.2097930908203125 seconds + 4: Time to load utils op: 0.20893120765686035 secondsTime to load utils op: 0.20904898643493652 seconds + 4: + 4: + 1: Time to load utils op: 0.21057510375976562 secondsTime to load utils op: 0.21070027351379395 seconds + 1: + 1: Time to load utils op: 0.21047759056091309 secondsTime to load utils op: 0.21062278747558594 seconds + 1: + 2: Time to load utils op: 0.21067476272583008 secondsTime to load utils op: 0.21061968803405762 secondsTime to load utils op: 0.21065568923950195 seconds + 2: + 2: + 2: Time to load utils op: 0.2105090618133545 seconds + 3: Time to load utils op: 0.2108900547027588 seconds + 3: Time to load utils op: 0.2110443115234375 seconds + 3: Time to load utils op: 0.21116161346435547 seconds + 3: Time to load utils op: 0.21101975440979004 seconds +14: Time to load utils op: 0.20755362510681152 seconds +14: Time to load utils op: 0.20765089988708496 seconds +14: Time to load utils op: 0.20782136917114258 seconds +14: Time to load utils op: 0.20792460441589355 seconds + 6: Time to load utils op: 0.21267127990722656 secondsTime to load utils op: 0.2126917839050293 seconds + 6: Time to load utils op: 0.21280860900878906 seconds + 6: + 6: Time to load utils op: 0.21291375160217285 seconds +16: Time to load utils op: 0.20739006996154785 seconds +16: Time to load utils op: 0.20762062072753906 seconds +16: Time to load utils op: 0.20769786834716797 seconds +15: Time to load utils op: 0.20852327346801758 seconds +15: Time to load utils op: 0.20838594436645508 seconds +16: Time to load utils op: 0.20783114433288574 seconds +19: Time to load utils op: 0.20632719993591309 seconds + 0: Time to load utils op: 0.40467286109924316 seconds +19: Time to load utils op: 0.2059342861175537 seconds +19: Time to load utils op: 0.20592546463012695 seconds +15: Time to load utils op: 0.20901966094970703 seconds +19: Time to load utils op: 0.20639514923095703 seconds +18: Time to load utils op: 0.207258939743042 seconds +18: Time to load utils op: 0.20705533027648926 seconds +18: Time to load utils op: 0.20735692977905273 seconds +17: Time to load utils op: 0.20791912078857422 seconds +18: Time to load utils op: 0.2072739601135254 seconds +15: Time to load utils op: 0.20940446853637695 seconds +17: Time to load utils op: 0.2078855037689209 seconds +17: Time to load utils op: 0.20792436599731445 seconds + 5: Time to load utils op: 0.2141420841217041 secondsTime to load utils op: 0.21419739723205566 secondsTime to load utils op: 0.21420550346374512 seconds + 5: + 5: + 5: Time to load utils op: 0.21402907371520996 seconds + 8: Time to load utils op: 0.21307826042175293 secondsTime to load utils op: 0.2135777473449707 secondsTime to load utils op: 0.21368908882141113 seconds + 8: + 8: + 8: Time to load utils op: 0.21307158470153809 seconds +17: Time to load utils op: 0.20803523063659668 seconds +23: Time to load utils op: 0.20598220825195312 seconds + 7: Time to load utils op: 0.2140331268310547 secondsTime to load utils op: 0.2139415740966797 seconds + 7: + 7: Time to load utils op: 0.21414613723754883 secondsTime to load utils op: 0.21380853652954102 seconds + 7: +23: Time to load utils op: 0.20631003379821777 seconds +23: Time to load utils op: 0.20650672912597656 seconds +22: Time to load utils op: 0.2066047191619873 seconds +23: Time to load utils op: 0.20632386207580566 seconds +22: Time to load utils op: 0.20644187927246094 seconds +22: Time to load utils op: 0.2067859172821045 seconds +24: Time to load utils op: 0.20554208755493164 seconds +24: Time to load utils op: 0.20544195175170898 seconds +22: Time to load utils op: 0.2070176601409912 seconds +24: Time to load utils op: 0.20575666427612305 seconds +24: Time to load utils op: 0.20583772659301758 seconds +10: Time to load utils op: 0.21399712562561035 secondsTime to load utils op: 0.21423602104187012 seconds +10: +10: Time to load utils op: 0.2142183780670166 seconds +10: Time to load utils op: 0.21398067474365234 seconds +26: Time to load utils op: 0.20460772514343262 seconds +26: Time to load utils op: 0.20455574989318848 seconds +26: Time to load utils op: 0.2044355869293213 seconds + 9: Time to load utils op: 0.2143726348876953 seconds + 9: Time to load utils op: 0.21456265449523926 secondsTime to load utils op: 0.21451187133789062 seconds + 9: + 9: Time to load utils op: 0.21465206146240234 seconds +26: Time to load utils op: 0.20495247840881348 seconds +28: Time to load utils op: 0.20292186737060547 seconds +28: Time to load utils op: 0.2038557529449463 secondsTime to load utils op: 0.20345067977905273 seconds +28: +31: Time to load utils op: 0.20273423194885254 seconds +25: Time to load utils op: 0.20526957511901855 secondsTime to load utils op: 0.20545029640197754 secondsTime to load utils op: 0.2052323818206787 seconds +25: +25: +29: Time to load utils op: 0.20349407196044922 seconds +25: Time to load utils op: 0.20545363426208496 seconds +11: Time to load utils op: 0.21358299255371094 secondsTime to load utils op: 0.21339154243469238 seconds +11: +11: Time to load utils op: 0.21417641639709473 secondsTime to load utils op: 0.21421003341674805 seconds +11: +29: Time to load utils op: 0.2039027214050293 seconds +27: Time to load utils op: 0.2044663429260254 seconds +28: Time to load utils op: 0.2041316032409668 seconds +31: Time to load utils op: 0.20251226425170898 seconds +30: Time to load utils op: 0.2028791904449463 seconds +27: Time to load utils op: 0.20476174354553223 seconds +31: Time to load utils op: 0.20254206657409668 seconds +31: Time to load utils op: 0.20254802703857422 seconds +27: Time to load utils op: 0.20486187934875488 seconds +27: Time to load utils op: 0.20499110221862793 seconds +29: Time to load utils op: 0.2042524814605713 seconds +29: Time to load utils op: 0.2042388916015625 seconds +30: Time to load utils op: 0.20307278633117676 seconds +30: Time to load utils op: 0.2032167911529541 seconds +30: Time to load utils op: 0.20331931114196777 seconds +13: Time to load utils op: 0.2146892547607422 secondsTime to load utils op: 0.21483969688415527 seconds +13: Time to load utils op: 0.2145841121673584 secondsTime to load utils op: 0.21469998359680176 seconds +13: +13: +12: Time to load utils op: 0.2153487205505371 secondsTime to load utils op: 0.21499300003051758 secondsTime to load utils op: 0.21522808074951172 seconds +12: +12: +12: Time to load utils op: 0.21495723724365234 seconds +20: Time to load utils op: 0.213425874710083 secondsTime to load utils op: 0.21395230293273926 seconds +20: Time to load utils op: 0.21363210678100586 seconds +20: +20: Time to load utils op: 0.21352481842041016 seconds +21: Time to load utils op: 0.21297144889831543 secondsTime to load utils op: 0.21326017379760742 secondsTime to load utils op: 0.2129971981048584 seconds +21: +21: +21: Time to load utils op: 0.21325922012329102 seconds + 0: Time to load utils op: 0.4028501510620117 seconds + 0: Time to load utils op: 0.40265965461730957 seconds + 0: Time to load utils op: 0.4033634662628174 seconds + 4: Time to load utils op: 0.4067068099975586 seconds + 4: Time to load utils op: 0.4069247245788574 seconds + 4: Time to load utils op: 0.4067957401275635 seconds + 1: Time to load utils op: 0.40451693534851074 seconds + 4: Time to load utils op: 0.40737414360046387 seconds + 1: Time to load utils op: 0.4047226905822754 seconds + 2: Time to load utils op: 0.4048879146575928 seconds + 1: Time to load utils op: 0.4049501419067383 seconds + 2: Time to load utils op: 0.4050180912017822 seconds + 2: Time to load utils op: 0.4050626754760742 seconds + 2: Time to load utils op: 0.4051811695098877 seconds + 1: Time to load utils op: 0.4052774906158447 seconds +21: Time to load utils op: 0.40549612045288086 seconds +21: Time to load utils op: 0.40546107292175293 seconds +21: Time to load utils op: 0.40570950508117676 seconds + 6: Time to load utils op: 0.40552330017089844 seconds +12: Time to load utils op: 0.40545010566711426 seconds +21: Time to load utils op: 0.40604281425476074 seconds + 8: Time to load utils op: 0.40526604652404785 seconds + 6: Time to load utils op: 0.4056892395019531 seconds + 9: Time to load utils op: 0.40554308891296387 seconds + 9: Time to load utils op: 0.4055521488189697 seconds +12: Time to load utils op: 0.4055063724517822 seconds + 9: Time to load utils op: 0.4055953025817871 seconds + 8: Time to load utils op: 0.40538668632507324 seconds +12: Time to load utils op: 0.40562963485717773 seconds + 9: Time to load utils op: 0.4057188034057617 seconds + 8: Time to load utils op: 0.4055008888244629 seconds + 7: Time to load utils op: 0.4058694839477539 seconds +13: Time to load utils op: 0.4057893753051758 seconds +12: Time to load utils op: 0.4057292938232422 seconds + 6: Time to load utils op: 0.4059181213378906 seconds +20: Time to load utils op: 0.40601372718811035 seconds + 7: Time to load utils op: 0.40598487854003906 seconds + 8: Time to load utils op: 0.40566563606262207 seconds +10: Time to load utils op: 0.40599703788757324 seconds +13: Time to load utils op: 0.40607500076293945 seconds +13: Time to load utils op: 0.4060938358306885 seconds +20: Time to load utils op: 0.40622448921203613 seconds +20: Time to load utils op: 0.40643930435180664 seconds +11: Time to load utils op: 0.40636515617370605 seconds + 3: Time to load utils op: 0.4060330390930176 seconds +13: Time to load utils op: 0.40621089935302734 seconds +11: Time to load utils op: 0.40637683868408203 seconds + 6: Time to load utils op: 0.406343936920166 seconds + 5: Time to load utils op: 0.406130313873291 seconds + 7: Time to load utils op: 0.4062962532043457 secondsTime to load utils op: 0.4062955379486084 seconds + 7: + 5: Time to load utils op: 0.4062931537628174 seconds +11: Time to load utils op: 0.4066157341003418 seconds + 3: Time to load utils op: 0.40625548362731934 seconds +10: Time to load utils op: 0.40648436546325684 seconds + 5: Time to load utils op: 0.40642738342285156 seconds +20: Time to load utils op: 0.4069852828979492 seconds +11: Time to load utils op: 0.40677404403686523 seconds +10: Time to load utils op: 0.4065892696380615 seconds + 5: Time to load utils op: 0.40659022331237793 seconds +10: Time to load utils op: 0.40671300888061523 seconds + 3: Time to load utils op: 0.40656232833862305 seconds + 3: Time to load utils op: 0.4066441059112549 seconds + 8: Time to load utils op: 0.0006260871887207031 seconds + 8: Time to load utils op: 0.0006091594696044922 secondsTime to load utils op: 0.0006146430969238281 secondsTime to load utils op: 0.0005981922149658203 seconds + 8: + 8: + 8: Time to load utils op: 0.0005726814270019531 seconds + 8: Time to load utils op: 0.0006754398345947266 seconds + 8: Time to load utils op: 0.0006744861602783203 seconds + 8: Time to load utils op: 0.0006494522094726562 seconds + 9: Time to load utils op: 0.0009105205535888672 seconds + 9: Time to load utils op: 0.0010461807250976562 seconds + 9: Time to load utils op: 0.00101470947265625 seconds + 9: Time to load utils op: 0.0012907981872558594 secondsTime to load utils op: 0.0012638568878173828 seconds + 9: + 9: Time to load utils op: 0.001280069351196289 seconds + 9: Time to load utils op: 0.0013661384582519531 seconds + 9: Time to load utils op: 0.001397848129272461 seconds +14: Time to load utils op: 0.0004994869232177734 seconds +30: Time to load utils op: 0.0011627674102783203 seconds +14: Time to load utils op: 0.0005135536193847656 seconds +14: Time to load utils op: 0.0005779266357421875 secondsTime to load utils op: 0.0005738735198974609 seconds +14: +14: Time to load utils op: 0.0006327629089355469 seconds +14: Time to load utils op: 0.0006501674652099609 secondsTime to load utils op: 0.0006506443023681641 seconds +14: +14: Time to load utils op: 0.0006544589996337891 seconds +30: Time to load utils op: 0.001672983169555664 secondsTime to load utils op: 0.0016319751739501953 seconds +30: +30: Time to load utils op: 0.001678466796875 seconds +30: Time to load utils op: 0.0016682147979736328 seconds +30: Time to load utils op: 0.0016217231750488281 seconds +30: Time to load utils op: 0.001703023910522461 seconds +30: Time to load utils op: 0.0017273426055908203 seconds +21: Time to load utils op: 0.0007894039154052734 seconds +21: Time to load utils op: 0.0009007453918457031 seconds +21: Time to load utils op: 0.0012385845184326172 seconds +21: Time to load utils op: 0.0012125968933105469 seconds +21: Time to load utils op: 0.0012023448944091797 seconds +21: Time to load utils op: 0.0011987686157226562 seconds +21: Time to load utils op: 0.0012354850769042969 seconds +21: Time to load utils op: 0.001247406005859375 seconds + 0: [2023-04-29 10:58:38,800] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: Time to load utils op: 0.00047659873962402344 seconds + 0: Time to load utils op: 0.0005066394805908203 secondsTime to load utils op: 0.0005249977111816406 secondsTime to load utils op: 0.0005064010620117188 secondsTime to load utils op: 0.0005214214324951172 secondsTime to load utils op: 0.00047898292541503906 seconds + 0: + 0: + 0: Time to load utils op: 0.0005207061767578125 seconds + 0: + 0: + 0: [2023-04-29 10:58:38,801] [INFO] [utils.py:828:see_memory_usage] MA 4.15 GB Max_MA 4.15 GB CA 4.18 GB Max_CA 4 GB + 0: [2023-04-29 10:58:38,801] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.92 GB, percent = 8.1% +26: Time to load utils op: 0.000415802001953125 seconds +26: Time to load utils op: 0.00040030479431152344 seconds +26: Time to load utils op: 0.0005364418029785156 secondsTime to load utils op: 0.00041031837463378906 seconds +26: +26: Time to load utils op: 0.0005064010620117188 seconds +26: Time to load utils op: 0.0005393028259277344 seconds +26: Time to load utils op: 0.0005462169647216797 seconds +26: Time to load utils op: 0.0006070137023925781 seconds +23: Time to load utils op: 0.0008475780487060547 secondsTime to load utils op: 0.0008754730224609375 seconds +23: +23: Time to load utils op: 0.0009334087371826172 seconds +23: Time to load utils op: 0.0009555816650390625 seconds +23: Time to load utils op: 0.0006546974182128906 secondsTime to load utils op: 0.0005459785461425781 seconds +23: +23: Time to load utils op: 0.0005319118499755859 seconds +23: Time to load utils op: 0.0005652904510498047 seconds + 1: Time to load utils op: 0.0007190704345703125 seconds + 1: Time to load utils op: 0.0009272098541259766 seconds +15: Time to load utils op: 0.0004601478576660156 seconds +15: Time to load utils op: 0.00042700767517089844 seconds +15: Time to load utils op: 0.0005114078521728516 secondsTime to load utils op: 0.0004696846008300781 seconds +15: Time to load utils op: 0.0004062652587890625 seconds +15: Time to load utils op: 0.0004215240478515625 seconds +15: +24: Time to load utils op: 0.0005102157592773438 seconds + 1: Time to load utils op: 0.001374959945678711 seconds + 1: Time to load utils op: 0.0013630390167236328 seconds +24: Time to load utils op: 0.0005125999450683594 seconds +15: Time to load utils op: 0.00040221214294433594 seconds +15: Time to load utils op: 0.0004928112030029297 seconds + 1: Time to load utils op: 0.001409769058227539 seconds + 1: Time to load utils op: 0.0013799667358398438 seconds + 1: Time to load utils op: 0.0013356208801269531 seconds + 1: Time to load utils op: 0.0013916492462158203 seconds +24: Time to load utils op: 0.0005702972412109375 secondsTime to load utils op: 0.0005805492401123047 seconds +24: +24: Time to load utils op: 0.0005919933319091797 seconds +24: Time to load utils op: 0.0006113052368164062 secondsTime to load utils op: 0.0005993843078613281 secondsTime to load utils op: 0.0006327629089355469 seconds +24: +24: +18: Time to load utils op: 0.0005271434783935547 seconds +18: Time to load utils op: 0.0005359649658203125 seconds +18: Time to load utils op: 0.0005540847778320312 seconds +18: Time to load utils op: 0.0005402565002441406 seconds +18: Time to load utils op: 0.0006163120269775391 seconds +18: Time to load utils op: 0.0006692409515380859 secondsTime to load utils op: 0.0006549358367919922 seconds +18: +18: Time to load utils op: 0.000690460205078125 seconds +22: Time to load utils op: 0.0006821155548095703 seconds +22: Time to load utils op: 0.0008604526519775391 seconds +22: Time to load utils op: 0.0008509159088134766 seconds +22: Time to load utils op: 0.0009450912475585938 seconds +22: Time to load utils op: 0.0011169910430908203 seconds +22: Time to load utils op: 0.0010919570922851562 seconds +22: Time to load utils op: 0.001093149185180664 seconds +22: Time to load utils op: 0.0011768341064453125 seconds +17: Time to load utils op: 0.0005075931549072266 seconds +17: Time to load utils op: 0.0005221366882324219 seconds + 3: Time to load utils op: 0.0009427070617675781 seconds +17: Time to load utils op: 0.0005249977111816406 seconds +17: Time to load utils op: 0.0006153583526611328 secondsTime to load utils op: 0.0006139278411865234 secondsTime to load utils op: 0.0006437301635742188 secondsTime to load utils op: 0.0006406307220458984 seconds +17: Time to load utils op: 0.0006368160247802734 seconds +17: +17: +17: + 6: Time to load utils op: 0.0009584426879882812 seconds + 3: Time to load utils op: 0.0010986328125 seconds +11: Time to load utils op: 0.0005409717559814453 secondsTime to load utils op: 0.0005550384521484375 secondsTime to load utils op: 0.0005688667297363281 secondsTime to load utils op: 0.0005676746368408203 seconds +11: +11: +11: + 6: Time to load utils op: 0.0013401508331298828 seconds + 3: Time to load utils op: 0.0014569759368896484 seconds +11: Time to load utils op: 0.0006225109100341797 secondsTime to load utils op: 0.0006120204925537109 secondsTime to load utils op: 0.0006234645843505859 seconds +11: +11: + 6: Time to load utils op: 0.0013294219970703125 secondsTime to load utils op: 0.0013051033020019531 seconds + 6: Time to load utils op: 0.0013709068298339844 seconds + 6: + 6: Time to load utils op: 0.0013630390167236328 seconds +11: Time to load utils op: 0.0005936622619628906 seconds + 3: Time to load utils op: 0.0015010833740234375 secondsTime to load utils op: 0.00145721435546875 seconds + 3: + 6: Time to load utils op: 0.0013370513916015625 seconds + 3: Time to load utils op: 0.0014710426330566406 seconds + 3: Time to load utils op: 0.0014715194702148438 seconds + 6: Time to load utils op: 0.0013992786407470703 seconds +31: Time to load utils op: 0.0005567073822021484 seconds + 3: Time to load utils op: 0.0015189647674560547 seconds + 5: Time to load utils op: 0.0008704662322998047 seconds +31: Time to load utils op: 0.000591278076171875 seconds +31: Time to load utils op: 0.0005409717559814453 seconds +31: Time to load utils op: 0.0005972385406494141 seconds +31: Time to load utils op: 0.0005922317504882812 seconds +31: Time to load utils op: 0.0005667209625244141 seconds +31: Time to load utils op: 0.0006062984466552734 seconds + 4: Time to load utils op: 0.0005023479461669922 seconds +31: Time to load utils op: 0.0006260871887207031 seconds + 4: Time to load utils op: 0.0005314350128173828 seconds +28: Time to load utils op: 0.0005908012390136719 seconds + 5: Time to load utils op: 0.0011255741119384766 seconds + 5: Time to load utils op: 0.0011229515075683594 seconds + 5: Time to load utils op: 0.0011985301971435547 seconds + 4: Time to load utils op: 0.0005650520324707031 seconds +28: Time to load utils op: 0.0005824565887451172 secondsTime to load utils op: 0.0005743503570556641 seconds +28: + 5: Time to load utils op: 0.0011363029479980469 seconds + 4: Time to load utils op: 0.0005519390106201172 secondsTime to load utils op: 0.0005929470062255859 seconds + 4: + 4: Time to load utils op: 0.0006136894226074219 secondsTime to load utils op: 0.0005917549133300781 seconds + 4: +28: Time to load utils op: 0.0005872249603271484 seconds + 4: Time to load utils op: 0.0005965232849121094 seconds + 5: Time to load utils op: 0.0011508464813232422 seconds + 5: Time to load utils op: 0.001155853271484375 seconds +28: Time to load utils op: 0.0006091594696044922 secondsTime to load utils op: 0.0005939006805419922 seconds +28: + 5: Time to load utils op: 0.0012052059173583984 seconds +28: Time to load utils op: 0.0006062984466552734 seconds +28: Time to load utils op: 0.0006594657897949219 seconds +27: Time to load utils op: 0.0005564689636230469 seconds +27: Time to load utils op: 0.0005664825439453125 seconds +27: Time to load utils op: 0.0005652904510498047 seconds +27: Time to load utils op: 0.0005972385406494141 seconds +27: Time to load utils op: 0.0006158351898193359 seconds +27: Time to load utils op: 0.0006198883056640625 secondsTime to load utils op: 0.0006349086761474609 seconds +27: +27: Time to load utils op: 0.0006387233734130859 seconds +16: Time to load utils op: 0.0012853145599365234 seconds +16: Time to load utils op: 0.0013642311096191406 seconds +19: Time to load utils op: 0.0005967617034912109 secondsTime to load utils op: 0.0006177425384521484 seconds +19: +19: Time to load utils op: 0.0005908012390136719 seconds +12: Time to load utils op: 0.0005931854248046875 seconds +16: Time to load utils op: 0.0014834403991699219 seconds +10: Time to load utils op: 0.0006868839263916016 seconds +10: Time to load utils op: 0.0006716251373291016 seconds +19: Time to load utils op: 0.0006563663482666016 secondsTime to load utils op: 0.0006806850433349609 seconds +19: +19: Time to load utils op: 0.0006589889526367188 seconds +19: Time to load utils op: 0.0006206035614013672 seconds +12: Time to load utils op: 0.0005936622619628906 seconds +16: Time to load utils op: 0.0014753341674804688 seconds +16: Time to load utils op: 0.0015218257904052734 seconds +19: Time to load utils op: 0.0006809234619140625 seconds +16: Time to load utils op: 0.0014886856079101562 seconds +10: Time to load utils op: 0.0007872581481933594 seconds +10: Time to load utils op: 0.0007836818695068359 seconds +12: Time to load utils op: 0.0006074905395507812 seconds +16: Time to load utils op: 0.0015065670013427734 seconds + 7: Time to load utils op: 0.00041675567626953125 seconds +16: Time to load utils op: 0.0015881061553955078 seconds +29: Time to load utils op: 0.0012063980102539062 seconds + 7: Time to load utils op: 0.0004863739013671875 seconds + 7: Time to load utils op: 0.00040721893310546875 seconds +12: Time to load utils op: 0.0006058216094970703 seconds +20: Time to load utils op: 0.0005548000335693359 seconds +10: Time to load utils op: 0.0010271072387695312 seconds +12: Time to load utils op: 0.0005660057067871094 seconds + 7: Time to load utils op: 0.0005540847778320312 seconds +13: Time to load utils op: 0.0011534690856933594 secondsTime to load utils op: 0.0011246204376220703 seconds +13: +12: Time to load utils op: 0.0006399154663085938 secondsTime to load utils op: 0.0007014274597167969 seconds +12: Time to load utils op: 0.0006492137908935547 seconds +12: +20: Time to load utils op: 0.0004553794860839844 seconds + 7: Time to load utils op: 0.0006039142608642578 seconds +20: Time to load utils op: 0.0004456043243408203 seconds + 7: Time to load utils op: 0.0006134510040283203 secondsTime to load utils op: 0.0006268024444580078 seconds + 7: + 7: Time to load utils op: 0.0006341934204101562 seconds +20: Time to load utils op: 0.0004830360412597656 seconds +10: Time to load utils op: 0.0011568069458007812 secondsTime to load utils op: 0.0011401176452636719 seconds +10: +29: Time to load utils op: 0.0014264583587646484 seconds +20: Time to load utils op: 0.00044345855712890625 seconds +29: Time to load utils op: 0.0014290809631347656 seconds +20: Time to load utils op: 0.0005762577056884766 seconds +10: Time to load utils op: 0.0011444091796875 seconds +20: Time to load utils op: 0.00046706199645996094 seconds +29: Time to load utils op: 0.0014548301696777344 seconds +20: Time to load utils op: 0.0004668235778808594 seconds +29: Time to load utils op: 0.0014338493347167969 secondsTime to load utils op: 0.0014717578887939453 seconds +29: +13: Time to load utils op: 0.0014371871948242188 seconds +29: Time to load utils op: 0.0015020370483398438 seconds +13: Time to load utils op: 0.0013616085052490234 seconds +13: Time to load utils op: 0.0013611316680908203 secondsTime to load utils op: 0.0013532638549804688 seconds +13: +29: Time to load utils op: 0.0015141963958740234 seconds +13: Time to load utils op: 0.001444101333618164 seconds +13: Time to load utils op: 0.0013890266418457031 seconds +25: Time to load utils op: 0.00047326087951660156 seconds +25: Time to load utils op: 0.0007529258728027344 seconds +25: Time to load utils op: 0.0004837512969970703 secondsTime to load utils op: 0.000484466552734375 seconds +25: +25: Time to load utils op: 0.0007741451263427734 seconds +25: Time to load utils op: 0.0004832744598388672 secondsTime to load utils op: 0.0005300045013427734 seconds +25: +25: Time to load utils op: 0.0004951953887939453 seconds + 2: Time to load utils op: 0.002148866653442383 seconds + 2: Time to load utils op: 0.00255584716796875 seconds + 2: Time to load utils op: 0.002605438232421875 seconds + 2: Time to load utils op: 0.002585172653198242 secondsTime to load utils op: 0.002589702606201172 seconds + 2: + 2: Time to load utils op: 0.0025472640991210938 seconds + 2: Time to load utils op: 0.002579212188720703 seconds + 2: Time to load utils op: 0.00264739990234375 seconds + 0: [2023-04-29 10:58:38,921] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-04-29 10:58:38,922] [INFO] [utils.py:828:see_memory_usage] MA 8.44 GB Max_MA 8.44 GB CA 10.57 GB Max_CA 11 GB + 0: [2023-04-29 10:58:38,922] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.05 GB, percent = 8.2% + 0: [2023-04-29 10:58:39,031] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-04-29 10:58:39,032] [INFO] [utils.py:828:see_memory_usage] MA 8.44 GB Max_MA 8.44 GB CA 10.57 GB Max_CA 11 GB + 0: [2023-04-29 10:58:39,032] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.13 GB, percent = 8.2% + 0: [2023-04-29 10:58:39,144] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-04-29 10:58:39,145] [INFO] [utils.py:828:see_memory_usage] MA 12.5 GB Max_MA 12.5 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,145] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.22 GB, percent = 8.2% + 0: [2023-04-29 10:58:39,255] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-04-29 10:58:39,255] [INFO] [utils.py:828:see_memory_usage] MA 12.5 GB Max_MA 12.5 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,255] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.29 GB, percent = 8.2% + 0: [2023-04-29 10:58:39,369] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-04-29 10:58:39,369] [INFO] [utils.py:828:see_memory_usage] MA 12.51 GB Max_MA 12.51 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,369] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.36 GB, percent = 8.2% +57: ninja: no work to do. +57: Time to load utils op: 0.2165215015411377 secondsTime to load utils op: 0.21655607223510742 secondsTime to load utils op: 0.21654462814331055 seconds +57: +57: +57: Time to load utils op: 0.2165815830230713 seconds +32: Time to load utils op: 0.20791411399841309 secondsTime to load utils op: 0.20792484283447266 seconds +32: +32: Time to load utils op: 0.20804500579833984 seconds +33: Time to load utils op: 0.20895934104919434 secondsTime to load utils op: 0.209242582321167 secondsTime to load utils op: 0.20902609825134277 seconds +33: +33: +33: Time to load utils op: 0.20899367332458496 seconds +34: Time to load utils op: 0.21081304550170898 secondsTime to load utils op: 0.21093034744262695 secondsTime to load utils op: 0.21050572395324707 secondsTime to load utils op: 0.21049165725708008 seconds +34: +34: +34: +36: Time to load utils op: 0.20926952362060547 secondsTime to load utils op: 0.2096402645111084 secondsTime to load utils op: 0.20966529846191406 seconds +36: +36: +36: Time to load utils op: 0.20986700057983398 seconds +35: Time to load utils op: 0.20968294143676758 seconds +35: Time to load utils op: 0.20939016342163086 seconds +35: Time to load utils op: 0.20943331718444824 seconds +35: Time to load utils op: 0.20940017700195312 seconds +37: Time to load utils op: 0.21010518074035645 secondsTime to load utils op: 0.20908236503601074 secondsTime to load utils op: 0.20989704132080078 seconds +37: +37: Time to load utils op: 0.20927834510803223 seconds +37: +39: Time to load utils op: 0.20851564407348633 seconds +39: Time to load utils op: 0.20958375930786133 seconds +39: Time to load utils op: 0.2086164951324463 secondsTime to load utils op: 0.20863986015319824 seconds +39: +38: Time to load utils op: 0.21006345748901367 secondsTime to load utils op: 0.21024775505065918 seconds +38: Time to load utils op: 0.21027040481567383 seconds +38: +38: Time to load utils op: 0.21024584770202637 seconds +42: Time to load utils op: 0.20908117294311523 secondsTime to load utils op: 0.209061861038208 secondsTime to load utils op: 0.20907092094421387 secondsTime to load utils op: 0.20887231826782227 seconds +42: +42: +42: +41: Time to load utils op: 0.20931768417358398 secondsTime to load utils op: 0.20935654640197754 secondsTime to load utils op: 0.209367036819458 seconds +41: +41: Time to load utils op: 0.2093815803527832 seconds +41: +40: Time to load utils op: 0.21055340766906738 secondsTime to load utils op: 0.21047091484069824 secondsTime to load utils op: 0.2105855941772461 seconds +40: +40: +40: Time to load utils op: 0.2106013298034668 seconds +43: Time to load utils op: 0.20949459075927734 secondsTime to load utils op: 0.20950102806091309 seconds +43: +43: Time to load utils op: 0.20961475372314453 seconds +43: Time to load utils op: 0.20948147773742676 seconds +57: Time to load utils op: 0.20226478576660156 seconds +57: Time to load utils op: 0.202134370803833 seconds +44: Time to load utils op: 0.2094581127166748 secondsTime to load utils op: 0.20975422859191895 seconds +44: Time to load utils op: 0.2098221778869629 secondsTime to load utils op: 0.20939421653747559 seconds +44: +44: +57: Time to load utils op: 0.20265555381774902 seconds +57: Time to load utils op: 0.20242071151733398 seconds +45: Time to load utils op: 0.20956778526306152 secondsTime to load utils op: 0.20957136154174805 seconds +45: Time to load utils op: 0.20955848693847656 secondsTime to load utils op: 0.20973730087280273 seconds +45: +45: +48: Time to load utils op: 0.20970821380615234 secondsTime to load utils op: 0.2097620964050293 secondsTime to load utils op: 0.20981955528259277 secondsTime to load utils op: 0.20944428443908691 seconds +48: +48: +48: +49: Time to load utils op: 0.20856785774230957 secondsTime to load utils op: 0.2086029052734375 secondsTime to load utils op: 0.20892000198364258 seconds +49: +49: Time to load utils op: 0.2089223861694336 seconds +49: +46: Time to load utils op: 0.21105504035949707 secondsTime to load utils op: 0.21106743812561035 seconds +46: Time to load utils op: 0.21111106872558594 seconds +46: +46: Time to load utils op: 0.2110579013824463 seconds +47: Time to load utils op: 0.2102973461151123 secondsTime to load utils op: 0.21030712127685547 secondsTime to load utils op: 0.21031522750854492 secondsTime to load utils op: 0.21027827262878418 seconds +47: +47: +47: +50: Time to load utils op: 0.20952677726745605 secondsTime to load utils op: 0.20929169654846191 secondsTime to load utils op: 0.20983076095581055 seconds +50: +50: +50: Time to load utils op: 0.20953774452209473 seconds +52: Time to load utils op: 0.20938539505004883 secondsTime to load utils op: 0.20941519737243652 seconds +52: Time to load utils op: 0.2095048427581787 seconds +52: +52: Time to load utils op: 0.20955681800842285 seconds +53: Time to load utils op: 0.20941805839538574 secondsTime to load utils op: 0.20939183235168457 seconds +53: Time to load utils op: 0.20954489707946777 secondsTime to load utils op: 0.20943045616149902 seconds +53: +53: +54: Time to load utils op: 0.2098531723022461 secondsTime to load utils op: 0.20957660675048828 secondsTime to load utils op: 0.2095334529876709 seconds +54: +54: +54: Time to load utils op: 0.20954227447509766 seconds +56: Time to load utils op: 0.20825576782226562 secondsTime to load utils op: 0.2082531452178955 seconds +56: +56: Time to load utils op: 0.208709716796875 secondsTime to load utils op: 0.20830202102661133 seconds +56: +55: Time to load utils op: 0.20955657958984375 seconds +55: Time to load utils op: 0.2098531723022461 secondsTime to load utils op: 0.20972537994384766 seconds +55: +55: Time to load utils op: 0.20972752571105957 seconds +60: Time to load utils op: 0.20772051811218262 secondsTime to load utils op: 0.2080245018005371 secondsTime to load utils op: 0.2077944278717041 seconds +60: +60: +60: Time to load utils op: 0.20779943466186523 seconds +58: Time to load utils op: 0.20848870277404785 secondsTime to load utils op: 0.2081606388092041 seconds +58: +58: Time to load utils op: 0.20819473266601562 secondsTime to load utils op: 0.2081902027130127 seconds +58: +59: Time to load utils op: 0.20904779434204102 secondsTime to load utils op: 0.20903396606445312 secondsTime to load utils op: 0.20905327796936035 secondsTime to load utils op: 0.20902085304260254 seconds +59: +59: +59: +61: Time to load utils op: 0.2086782455444336 secondsTime to load utils op: 0.20891356468200684 seconds +61: Time to load utils op: 0.20873284339904785 seconds +61: Time to load utils op: 0.2087552547454834 seconds +61: +51: Time to load utils op: 0.21479415893554688 secondsTime to load utils op: 0.21458220481872559 seconds +51: +51: Time to load utils op: 0.21457147598266602 seconds +51: Time to load utils op: 0.2145521640777588 seconds +62: Time to load utils op: 0.20846223831176758 seconds +62: Time to load utils op: 0.20845556259155273 secondsTime to load utils op: 0.20844101905822754 seconds +62: +62: Time to load utils op: 0.20847082138061523 seconds +63: Time to load utils op: 0.20804286003112793 secondsTime to load utils op: 0.2083268165588379 secondsTime to load utils op: 0.20816659927368164 seconds +63: +63: +63: Time to load utils op: 0.2084352970123291 seconds +32: Time to load utils op: 0.000461578369140625 seconds +32: Time to load utils op: 0.0005061626434326172 seconds +32: Time to load utils op: 0.0005190372467041016 seconds +36: Time to load utils op: 0.0005393028259277344 secondsTime to load utils op: 0.0005543231964111328 secondsTime to load utils op: 0.0005545616149902344 secondsTime to load utils op: 0.0005602836608886719 seconds +36: +36: +36: +57: Time to load utils op: 0.0005533695220947266 seconds +57: Time to load utils op: 0.0005593299865722656 seconds +57: Time to load utils op: 0.0004985332489013672 seconds +57: Time to load utils op: 0.0005974769592285156 secondsTime to load utils op: 0.0006175041198730469 seconds +57: +57: Time to load utils op: 0.0006356239318847656 seconds +57: Time to load utils op: 0.0006325244903564453 seconds +57: Time to load utils op: 0.0005192756652832031 seconds +33: Time to load utils op: 0.0005135536193847656 seconds +33: Time to load utils op: 0.0004951953887939453 seconds +33: Time to load utils op: 0.0005114078521728516 seconds +33: Time to load utils op: 0.0005252361297607422 seconds +32: Time to load utils op: 0.30396032333374023 seconds +35: Time to load utils op: 0.0004990100860595703 seconds +35: Time to load utils op: 0.00046563148498535156 seconds +35: Time to load utils op: 0.0005025863647460938 seconds +35: Time to load utils op: 0.0005083084106445312 seconds +39: Time to load utils op: 0.0004994869232177734 seconds +39: Time to load utils op: 0.0005404949188232422 seconds +39: Time to load utils op: 0.0004971027374267578 seconds +39: Time to load utils op: 0.0005345344543457031 seconds +38: Time to load utils op: 0.000514984130859375 seconds +38: Time to load utils op: 0.0005490779876708984 seconds +38: Time to load utils op: 0.0005624294281005859 seconds +38: Time to load utils op: 0.0005586147308349609 seconds +34: Time to load utils op: 0.00048089027404785156 secondsTime to load utils op: 0.00048613548278808594 seconds +34: +34: Time to load utils op: 0.0003790855407714844 seconds +34: Time to load utils op: 0.0004951953887939453 seconds +42: Time to load utils op: 0.0005090236663818359 seconds +42: Time to load utils op: 0.0005061626434326172 seconds +42: Time to load utils op: 0.0004894733428955078 seconds +42: Time to load utils op: 0.0005199909210205078 seconds +37: Time to load utils op: 0.0005033016204833984 seconds +37: Time to load utils op: 0.00051116943359375 secondsTime to load utils op: 0.0005533695220947266 seconds +37: +37: Time to load utils op: 0.0005221366882324219 seconds +41: Time to load utils op: 0.0005042552947998047 seconds +41: Time to load utils op: 0.0005090236663818359 seconds +41: Time to load utils op: 0.0005211830139160156 seconds +41: Time to load utils op: 0.0005166530609130859 seconds +32: Time to load utils op: 0.30223941802978516 seconds +32: Time to load utils op: 0.30254220962524414 seconds +32: Time to load utils op: 0.302473783493042 seconds + 0: [2023-04-29 10:58:39,480] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer +43: Time to load utils op: 0.0005307197570800781 seconds +43: Time to load utils op: 0.0005576610565185547 seconds +43: Time to load utils op: 0.0005772113800048828 secondsTime to load utils op: 0.0005815029144287109 seconds +43: + 0: [2023-04-29 10:58:39,481] [INFO] [utils.py:828:see_memory_usage] MA 12.51 GB Max_MA 12.51 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,481] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.41 GB, percent = 8.2% +48: Time to load utils op: 0.00046539306640625 seconds +48: Time to load utils op: 0.0005240440368652344 secondsTime to load utils op: 0.0005207061767578125 seconds +48: Time to load utils op: 0.0005140304565429688 seconds +48: +34: Time to load utils op: 0.30558276176452637 seconds +60: Time to load utils op: 0.0005249977111816406 seconds +60: Time to load utils op: 0.0005469322204589844 seconds +60: Time to load utils op: 0.0005693435668945312 seconds +34: Time to load utils op: 0.3050200939178467 seconds +34: Time to load utils op: 0.3055248260498047 secondsTime to load utils op: 0.30558180809020996 seconds +34: +60: Time to load utils op: 0.0005555152893066406 seconds +37: Time to load utils op: 0.30353593826293945 seconds +37: Time to load utils op: 0.3042306900024414 seconds +49: Time to load utils op: 0.0004911422729492188 seconds +37: Time to load utils op: 0.3040885925292969 seconds +49: Time to load utils op: 0.0005338191986083984 seconds +37: Time to load utils op: 0.30475449562072754 seconds +49: Time to load utils op: 0.0005307197570800781 seconds +49: Time to load utils op: 0.0005471706390380859 seconds +36: Time to load utils op: 0.30550670623779297 seconds +36: Time to load utils op: 0.3050425052642822 seconds +36: Time to load utils op: 0.3054041862487793 seconds +36: Time to load utils op: 0.30576205253601074 seconds +44: Time to load utils op: 0.0005025863647460938 seconds +44: Time to load utils op: 0.0005192756652832031 secondsTime to load utils op: 0.0005404949188232422 seconds +44: +44: Time to load utils op: 0.0007333755493164062 seconds +45: Time to load utils op: 0.0005135536193847656 seconds +45: Time to load utils op: 0.0005347728729248047 secondsTime to load utils op: 0.0005371570587158203 seconds +45: +45: Time to load utils op: 0.0005621910095214844 seconds +47: Time to load utils op: 0.0005211830139160156 seconds +47: Time to load utils op: 0.0005159378051757812 secondsTime to load utils op: 0.0005166530609130859 seconds +47: +47: Time to load utils op: 0.00047516822814941406 seconds +39: Time to load utils op: 0.3043394088745117 secondsTime to load utils op: 0.30434751510620117 seconds +39: +39: Time to load utils op: 0.30479979515075684 seconds +39: Time to load utils op: 0.3046605587005615 seconds +32: Time to load utils op: 0.0003476142883300781 seconds +35: Time to load utils op: 0.3046097755432129 seconds +33: Time to load utils op: 0.30530762672424316 seconds +33: Time to load utils op: 0.3053145408630371 seconds +33: Time to load utils op: 0.30533409118652344 secondsTime to load utils op: 0.30533814430236816 seconds +33: +35: Time to load utils op: 0.30472612380981445 seconds +35: Time to load utils op: 0.30473828315734863 seconds +35: Time to load utils op: 0.30481696128845215 seconds +44: Time to load utils op: 0.30496692657470703 secondsTime to load utils op: 0.30493903160095215 seconds +44: +44: Time to load utils op: 0.3049814701080322 seconds +44: Time to load utils op: 0.3052403926849365 seconds +38: Time to load utils op: 0.3048238754272461 secondsTime to load utils op: 0.3048269748687744 seconds +38: +38: Time to load utils op: 0.3049163818359375 seconds +38: Time to load utils op: 0.30493831634521484 seconds +40: Time to load utils op: 0.3047220706939697 seconds +40: Time to load utils op: 0.3048982620239258 seconds +40: Time to load utils op: 0.3050112724304199 seconds +41: Time to load utils op: 0.30466437339782715 secondsTime to load utils op: 0.30466437339782715 seconds +41: +41: Time to load utils op: 0.3047327995300293 secondsTime to load utils op: 0.30473852157592773 seconds +41: +40: Time to load utils op: 0.3053781986236572 seconds +40: Time to load utils op: 0.0004975795745849609 seconds +51: Time to load utils op: 0.0005128383636474609 seconds +51: Time to load utils op: 0.0005230903625488281 seconds +40: Time to load utils op: 0.0005407333374023438 secondsTime to load utils op: 0.0005679130554199219 seconds +40: +40: Time to load utils op: 0.0006003379821777344 seconds +51: Time to load utils op: 0.0005204677581787109 seconds +50: Time to load utils op: 0.3049769401550293 seconds +51: Time to load utils op: 0.0005285739898681641 seconds +42: Time to load utils op: 0.30530714988708496 seconds +42: Time to load utils op: 0.30536794662475586 seconds +50: Time to load utils op: 0.30530261993408203 seconds +50: Time to load utils op: 0.3051440715789795 seconds +43: Time to load utils op: 0.30521416664123535 seconds +43: Time to load utils op: 0.30524444580078125 seconds +43: Time to load utils op: 0.30524134635925293 seconds +43: Time to load utils op: 0.30525898933410645 seconds +42: Time to load utils op: 0.30545949935913086 secondsTime to load utils op: 0.30545878410339355 seconds +42: +47: Time to load utils op: 0.3046121597290039 seconds +47: Time to load utils op: 0.30460619926452637 seconds +50: Time to load utils op: 0.3052980899810791 seconds +45: Time to load utils op: 0.3046298027038574 secondsTime to load utils op: 0.3046271800994873 seconds +45: +45: Time to load utils op: 0.30463600158691406 seconds +45: Time to load utils op: 0.30464863777160645 seconds +47: Time to load utils op: 0.3048865795135498 secondsTime to load utils op: 0.3048827648162842 seconds +47: +46: Time to load utils op: 0.3049490451812744 seconds +46: Time to load utils op: 0.3050272464752197 seconds +46: Time to load utils op: 0.30527472496032715 seconds +46: Time to load utils op: 0.3054463863372803 seconds +53: Time to load utils op: 0.0005207061767578125 seconds +53: Time to load utils op: 0.0004994869232177734 seconds +48: Time to load utils op: 0.30446338653564453 seconds +53: Time to load utils op: 0.0005333423614501953 seconds +53: Time to load utils op: 0.0004906654357910156 seconds +48: Time to load utils op: 0.30450987815856934 secondsTime to load utils op: 0.30451107025146484 seconds +48: +48: Time to load utils op: 0.3045320510864258 seconds +32: Time to load utils op: 0.30230212211608887 seconds +52: Time to load utils op: 0.00047326087951660156 seconds +52: Time to load utils op: 0.0004913806915283203 secondsTime to load utils op: 0.000492095947265625 seconds +52: +50: Time to load utils op: 0.0003669261932373047 seconds +50: Time to load utils op: 0.0005145072937011719 seconds +50: Time to load utils op: 0.00048470497131347656 seconds +50: Time to load utils op: 0.0005567073822021484 seconds +54: Time to load utils op: 0.0005104541778564453 seconds +54: Time to load utils op: 0.0005362033843994141 seconds +49: Time to load utils op: 0.3049907684326172 seconds +54: Time to load utils op: 0.0005340576171875 seconds +49: Time to load utils op: 0.3050382137298584 secondsTime to load utils op: 0.3050506114959717 seconds +49: +54: Time to load utils op: 0.0004048347473144531 seconds +49: Time to load utils op: 0.30514073371887207 seconds +52: Time to load utils op: 0.00048089027404785156 seconds +54: Time to load utils op: 0.30475783348083496 seconds +51: Time to load utils op: 0.3048982620239258 seconds +54: Time to load utils op: 0.3048398494720459 seconds +54: Time to load utils op: 0.30489110946655273 seconds +51: Time to load utils op: 0.30529069900512695 secondsTime to load utils op: 0.3052866458892822 seconds +51: +51: Time to load utils op: 0.30531907081604004 seconds +32: Time to load utils op: 0.0003440380096435547 seconds +54: Time to load utils op: 0.3052980899810791 seconds +61: Time to load utils op: 0.0005507469177246094 seconds +61: Time to load utils op: 0.0005660057067871094 seconds +61: Time to load utils op: 0.0005621910095214844 seconds +61: Time to load utils op: 0.0005173683166503906 seconds +53: Time to load utils op: 0.30497217178344727 seconds +53: Time to load utils op: 0.3050105571746826 seconds +32: Time to load utils op: 0.0003349781036376953 seconds +55: Time to load utils op: 0.0005524158477783203 seconds +58: Time to load utils op: 0.00047206878662109375 seconds +55: Time to load utils op: 0.0005660057067871094 seconds +55: Time to load utils op: 0.0005869865417480469 seconds +55: Time to load utils op: 0.0005772113800048828 seconds +53: Time to load utils op: 0.30518078804016113 seconds +53: Time to load utils op: 0.30521416664123535 seconds +58: Time to load utils op: 0.0004949569702148438 seconds +58: Time to load utils op: 0.0005207061767578125 seconds +32: Time to load utils op: 0.00037026405334472656 seconds +58: Time to load utils op: 0.0005395412445068359 seconds +56: Time to load utils op: 0.3052802085876465 seconds +56: Time to load utils op: 0.0004894733428955078 seconds +59: Time to load utils op: 0.0005095005035400391 seconds +56: Time to load utils op: 0.3053734302520752 secondsTime to load utils op: 0.0005044937133789062 seconds +56: +56: Time to load utils op: 0.00047397613525390625 seconds +59: Time to load utils op: 0.0005435943603515625 seconds +59: Time to load utils op: 0.0005445480346679688 secondsTime to load utils op: 0.0005359649658203125 seconds +59: +55: Time to load utils op: 0.30544447898864746 seconds +56: Time to load utils op: 0.30542612075805664 seconds +56: Time to load utils op: 0.0005159378051757812 seconds +56: Time to load utils op: 0.3055546283721924 seconds +46: Time to load utils op: 0.0005006790161132812 secondsTime to load utils op: 0.0004706382751464844 seconds +46: +55: Time to load utils op: 0.305757999420166 seconds +46: Time to load utils op: 0.0005090236663818359 seconds +46: Time to load utils op: 0.0005404949188232422 seconds +55: Time to load utils op: 0.3058815002441406 seconds +55: Time to load utils op: 0.3059689998626709 seconds +62: Time to load utils op: 0.0005164146423339844 seconds +62: Time to load utils op: 0.0005674362182617188 seconds +62: Time to load utils op: 0.0005376338958740234 seconds +62: Time to load utils op: 0.0005345344543457031 seconds +52: Time to load utils op: 0.30454230308532715 seconds +52: Time to load utils op: 0.30455636978149414 seconds +52: Time to load utils op: 0.3045613765716553 seconds +52: Time to load utils op: 0.3046414852142334 seconds +34: Time to load utils op: 0.00034928321838378906 seconds +37: Time to load utils op: 0.0003535747528076172 seconds +37: Time to load utils op: 0.0003685951232910156 seconds +37: Time to load utils op: 0.00038433074951171875 seconds +36: Time to load utils op: 0.00039505958557128906 seconds +34: Time to load utils op: 0.00039768218994140625 seconds +37: Time to load utils op: 0.0003542900085449219 seconds +34: Time to load utils op: 0.0003666877746582031 seconds +36: Time to load utils op: 0.00038933753967285156 secondsTime to load utils op: 0.00039458274841308594 seconds +36: +34: Time to load utils op: 0.00036525726318359375 seconds +36: Time to load utils op: 0.00040984153747558594 seconds +59: Time to load utils op: 0.3080151081085205 secondsTime to load utils op: 0.30802106857299805 seconds +59: +58: Time to load utils op: 0.3084263801574707 seconds +59: Time to load utils op: 0.30806660652160645 seconds +58: Time to load utils op: 0.30844569206237793 seconds +58: Time to load utils op: 0.3085157871246338 seconds +59: Time to load utils op: 0.3083627223968506 seconds +58: Time to load utils op: 0.3087749481201172 seconds +39: Time to load utils op: 0.0003790855407714844 seconds +61: Time to load utils op: 0.30695438385009766 seconds +39: Time to load utils op: 0.00035119056701660156 seconds +39: Time to load utils op: 0.00038886070251464844 seconds +61: Time to load utils op: 0.30712032318115234 seconds +61: Time to load utils op: 0.3072316646575928 secondsTime to load utils op: 0.3072471618652344 seconds +61: +62: Time to load utils op: 0.3063228130340576 seconds +60: Time to load utils op: 0.30731797218322754 secondsTime to load utils op: 0.3073239326477051 seconds +60: +60: Time to load utils op: 0.3073098659515381 secondsTime to load utils op: 0.3073253631591797 seconds +60: +39: Time to load utils op: 0.0003790855407714844 seconds +62: Time to load utils op: 0.3066987991333008 secondsTime to load utils op: 0.3066902160644531 seconds +62: +62: Time to load utils op: 0.30672502517700195 seconds +33: Time to load utils op: 0.0003695487976074219 seconds +33: Time to load utils op: 0.00038814544677734375 seconds +33: Time to load utils op: 0.00041103363037109375 secondsTime to load utils op: 0.00042510032653808594 seconds +33: +63: Time to load utils op: 0.0005097389221191406 seconds +63: Time to load utils op: 0.0005574226379394531 seconds +63: Time to load utils op: 0.0005261898040771484 secondsTime to load utils op: 0.0005571842193603516 seconds +63: +44: Time to load utils op: 0.0003387928009033203 seconds +44: Time to load utils op: 0.0004343986511230469 seconds +44: Time to load utils op: 0.0003895759582519531 seconds +44: Time to load utils op: 0.00042724609375 seconds +35: Time to load utils op: 0.0004036426544189453 seconds +35: Time to load utils op: 0.00036644935607910156 seconds +35: Time to load utils op: 0.00039076805114746094 seconds +35: Time to load utils op: 0.00038361549377441406 seconds +38: Time to load utils op: 0.00037598609924316406 seconds +38: Time to load utils op: 0.00040531158447265625 seconds +38: Time to load utils op: 0.0003986358642578125 seconds +38: Time to load utils op: 0.0003712177276611328 seconds +40: Time to load utils op: 0.0003712177276611328 seconds +40: Time to load utils op: 0.00035858154296875 seconds +40: Time to load utils op: 0.000347137451171875 seconds +40: Time to load utils op: 0.000362396240234375 seconds +63: Time to load utils op: 0.30625176429748535 seconds +63: Time to load utils op: 0.3062314987182617 seconds +41: Time to load utils op: 0.00035762786865234375 seconds +63: Time to load utils op: 0.3062872886657715 seconds +63: Time to load utils op: 0.3063340187072754 seconds +41: Time to load utils op: 0.00036907196044921875 seconds +41: Time to load utils op: 0.000385284423828125 seconds +41: Time to load utils op: 0.0003838539123535156 seconds +50: Time to load utils op: 0.0003807544708251953 seconds +42: Time to load utils op: 0.00036025047302246094 seconds +50: Time to load utils op: 0.0004029273986816406 seconds +45: Time to load utils op: 0.00039839744567871094 seconds +43: Time to load utils op: 0.00035858154296875 seconds +42: Time to load utils op: 0.00035953521728515625 seconds +47: Time to load utils op: 0.00037789344787597656 seconds +48: Time to load utils op: 0.00034809112548828125 seconds +46: Time to load utils op: 0.0003669261932373047 seconds +50: Time to load utils op: 0.0003821849822998047 seconds +50: Time to load utils op: 0.0003616809844970703 seconds +46: Time to load utils op: 0.000354766845703125 seconds +45: Time to load utils op: 0.00038623809814453125 seconds +45: Time to load utils op: 0.0003674030303955078 seconds +47: Time to load utils op: 0.0003459453582763672 seconds +45: Time to load utils op: 0.0003571510314941406 seconds +42: Time to load utils op: 0.0003685951232910156 seconds +42: Time to load utils op: 0.0003521442413330078 seconds +43: Time to load utils op: 0.0004279613494873047 seconds +48: Time to load utils op: 0.0003886222839355469 seconds +47: Time to load utils op: 0.0003871917724609375 seconds +47: Time to load utils op: 0.000362396240234375 seconds +43: Time to load utils op: 0.0004100799560546875 seconds +48: Time to load utils op: 0.0003561973571777344 seconds +48: Time to load utils op: 0.0003399848937988281 seconds +43: Time to load utils op: 0.0003986358642578125 seconds +46: Time to load utils op: 0.0003483295440673828 seconds +46: Time to load utils op: 0.0003418922424316406 seconds +49: Time to load utils op: 0.0003783702850341797 secondsTime to load utils op: 0.00037980079650878906 seconds +49: +49: Time to load utils op: 0.0003762245178222656 secondsTime to load utils op: 0.0003616809844970703 seconds +49: +53: Time to load utils op: 0.000362396240234375 seconds +51: Time to load utils op: 0.00036025047302246094 seconds +51: Time to load utils op: 0.00035834312438964844 seconds +53: Time to load utils op: 0.0003402233123779297 seconds +51: Time to load utils op: 0.0003662109375 seconds +56: Time to load utils op: 0.0003924369812011719 seconds +56: Time to load utils op: 0.0003848075866699219 seconds +56: Time to load utils op: 0.0003516674041748047 seconds +51: Time to load utils op: 0.00038552284240722656 seconds +56: Time to load utils op: 0.0003864765167236328 seconds +53: Time to load utils op: 0.0003952980041503906 seconds +54: Time to load utils op: 0.0003819465637207031 seconds +54: Time to load utils op: 0.0004069805145263672 seconds +53: Time to load utils op: 0.00040602684020996094 seconds +54: Time to load utils op: 0.00037026405334472656 seconds +52: Time to load utils op: 0.00038504600524902344 seconds +54: Time to load utils op: 0.0003466606140136719 seconds +52: Time to load utils op: 0.00039267539978027344 seconds +52: Time to load utils op: 0.0003578662872314453 seconds +55: Time to load utils op: 0.0003554821014404297 seconds +52: Time to load utils op: 0.00037479400634765625 seconds +55: Time to load utils op: 0.00041675567626953125 seconds +55: Time to load utils op: 0.0004131793975830078 seconds +55: Time to load utils op: 0.0003986358642578125 seconds +58: Time to load utils op: 0.00035858154296875 seconds +59: Time to load utils op: 0.0003790855407714844 seconds +59: Time to load utils op: 0.0003743171691894531 seconds +62: Time to load utils op: 0.0003726482391357422 seconds +58: Time to load utils op: 0.0003650188446044922 seconds +59: Time to load utils op: 0.0003707408905029297 seconds +58: Time to load utils op: 0.0003752708435058594 seconds +58: Time to load utils op: 0.0003476142883300781 seconds +62: Time to load utils op: 0.00036597251892089844 seconds +61: Time to load utils op: 0.00036263465881347656 seconds +61: Time to load utils op: 0.00041031837463378906 seconds +61: Time to load utils op: 0.00039577484130859375 seconds +61: Time to load utils op: 0.00038886070251464844 seconds +62: Time to load utils op: 0.000347137451171875 seconds +60: Time to load utils op: 0.0004439353942871094 seconds +62: Time to load utils op: 0.00032067298889160156 seconds +60: Time to load utils op: 0.0003991127014160156 seconds +60: Time to load utils op: 0.00039887428283691406 seconds +60: Time to load utils op: 0.0003807544708251953 seconds +59: Time to load utils op: 0.0004131793975830078 seconds +63: Time to load utils op: 0.0003788471221923828 seconds +63: Time to load utils op: 0.00039315223693847656 seconds +63: Time to load utils op: 0.00039839744567871094 seconds +63: Time to load utils op: 0.0003631114959716797 seconds +32: Time to load utils op: 0.0004987716674804688 seconds + 0: [2023-04-29 10:58:39,798] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-04-29 10:58:39,799] [INFO] [utils.py:828:see_memory_usage] MA 12.64 GB Max_MA 12.64 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,799] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 42.07 GB, percent = 8.4% + 0: [2023-04-29 10:58:39,912] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-04-29 10:58:39,913] [INFO] [utils.py:828:see_memory_usage] MA 12.64 GB Max_MA 12.64 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 10:58:39,913] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.87 GB, percent = 8.3% + 0: [2023-04-29 10:58:39,913] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-04-29 10:58:39,913] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-04-29 10:58:39,913] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-04-29 10:58:39,913] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-04-29 10:58:39,914] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-04-29 10:58:39,914] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-04-29 10:58:39,914] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-04-29 10:58:39,914] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-04-29 10:58:39,914] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 4 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-04-29 10:58:39,915] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] train_batch_size ............. 512 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 1 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] world_size ................... 128 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-04-29 10:58:39,916] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 1, + 0: "train_batch_size": 512, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.0028722286224365234 seconds + 0: [2023-04-29 10:58:39,919] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=4 micro_batch_size=1 + 0: [2023-04-29 10:58:40,848] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=24 [0, 24) STAGE_PARAMS=2226419712 (2226.420M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) + 0: [2023-04-29 10:58:40,848] [INFO] [engine.py:145:__init__] RANK=1 STAGE=0 LAYERS=24 [0, 24) STAGE_PARAMS=2226419712 (2226.420M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +32: [2023-04-29 10:58:40,854] [INFO] [engine.py:145:__init__] RANK=257 STAGE=1 LAYERS=25 [24, 49) STAGE_PARAMS=2226427904 (2226.428M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +32: [2023-04-29 10:58:40,854] [INFO] [engine.py:145:__init__] RANK=256 STAGE=1 LAYERS=25 [24, 49) STAGE_PARAMS=2226427904 (2226.428M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +56: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 10:58:41,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 6: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +42: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +11: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 10:58:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 8: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 8: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +35: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +21: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +21: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +27: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 2: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 7: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 4: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 2: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 10:58:41,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 7: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +34: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 4: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 4: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +32: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +54: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 4: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +13: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +33: [2023-04-29 10:58:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +20: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +43: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +20: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +30: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +44: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +14: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +26: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +59: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +26: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +26: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +59: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +48: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +57: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +48: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +50: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +25: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +25: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +60: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +28: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 1: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +17: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +17: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +63: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 10:58:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +10: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +31: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +10: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +31: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 10:58:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +28: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +28: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +28: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +34: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +31: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +49: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +34: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +31: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +34: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +53: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +31: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +55: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +53: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +47: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +47: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +51: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +34: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +16: [2023-04-29 10:58:41,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 10:58:41,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 10:58:41,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:41,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +56: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +56: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 9: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +56: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 6: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +22: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +14: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +14: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 10:58:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +15: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +42: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +27: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +56: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +42: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +20: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +20: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +45: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +15: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +15: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +32: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +32: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +44: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +45: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +30: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +54: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +34: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +34: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +34: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +35: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +53: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 7: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +40: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 4: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +52: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +52: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +36: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 0: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +53: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 7: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +40: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +15: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +57: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +13: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +34: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +32: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 4: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +33: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +15: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +13: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +33: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 0: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +42: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +49: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +20: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +52: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. + 7: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +42: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +15: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +60: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +60: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +20: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +32: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +26: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +26: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +54: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +19: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +44: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +20: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +60: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +34: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +19: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +38: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +37: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +26: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +53: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +15: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +24: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +33: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +13: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +44: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +24: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +32: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +24: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +41: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +47: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +33: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +33: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +25: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +25: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +53: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +49: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +63: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +50: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 3: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +60: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +25: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +38: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +10: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +60: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +13: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +19: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +38: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +31: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +31: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +10: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +10: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +38: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 5: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +60: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +13: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +37: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +31: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +38: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +51: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +51: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +28: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +10: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +37: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +24: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +63: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +19: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +23: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +51: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +23: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +52: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +25: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +31: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_01_model_states.pt. +46: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +24: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +10: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +31: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +63: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +51: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +63: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +23: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +58: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 10:58:41,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 10:58:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 10:58:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 10:58:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +11: [2023-04-29 10:58:42,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 10:58:42,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 10:58:42,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 10:58:42,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 10:58:42,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 10:58:42,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 10:58:42,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 10:58:42,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:42,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 10:58:42,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 10:58:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 10:58:42,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:42,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:42,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 10:58:42,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 10:58:42,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:42,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 10:58:42,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:42,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 10:58:42,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:42,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 10:58:42,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:42,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 10:58:42,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +19: [2023-04-29 10:58:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +15: [2023-04-29 10:58:42,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +15: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +15: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 10:58:42,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 10:58:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 10:58:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 10:58:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 10:58:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 10:58:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 10:58:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 10:58:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 10:58:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +19: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 10:58:42,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:42,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +19: [2023-04-29 10:58:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 10:58:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 10:58:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 10:58:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 10:58:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 10:58:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:42,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 10:58:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +17: [2023-04-29 10:58:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 10:58:42,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 10:58:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +17: [2023-04-29 10:58:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:42,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 10:58:42,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +62: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +23: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +62: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 7: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 10:58:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... + 7: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:42,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 10:58:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 10:58:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +20: [2023-04-29 10:58:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 10:58:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +23: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 10:58:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +30: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 10:58:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +16: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +23: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 0: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 10:58:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... + 0: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:42,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 10:58:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +30: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +43: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +43: [2023-04-29 10:58:42,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +22: [2023-04-29 10:58:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +43: [2023-04-29 10:58:42,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +10: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +43: [2023-04-29 10:58:42,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +43: [2023-04-29 10:58:42,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +43: [2023-04-29 10:58:42,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... + 5: [2023-04-29 10:58:42,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +43: [2023-04-29 10:58:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +22: [2023-04-29 10:58:42,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 10:58:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 4: [2023-04-29 10:58:42,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +45: [2023-04-29 10:58:42,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +10: [2023-04-29 10:58:42,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 10:58:42,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 10:58:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +45: [2023-04-29 10:58:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +45: [2023-04-29 10:58:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +45: [2023-04-29 10:58:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 10:58:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +10: [2023-04-29 10:58:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 10:58:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 10:58:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 10:58:42,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 10:58:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +21: [2023-04-29 10:58:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 10:58:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 10:58:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 10:58:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +13: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 10:58:42,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 10:58:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +31: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +62: [2023-04-29 10:58:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... + 7: [2023-04-29 10:58:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 10:58:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 10:58:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... + 0: [2023-04-29 10:58:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 10:58:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +43: [2023-04-29 10:58:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +13: [2023-04-29 10:58:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 10:58:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 10:58:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 10:58:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +53: [2023-04-29 10:58:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:42,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 10:58:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 10:58:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 10:58:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +16: [2023-04-29 10:58:42,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:42,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:42,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +13: [2023-04-29 10:58:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 10:58:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 10:58:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 10:58:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +23: [2023-04-29 10:58:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 10:58:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 10:58:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 10:58:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 10:58:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 10:58:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 10:58:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 10:58:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:42,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:42,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:42,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 10:58:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 10:58:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 10:58:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 10:58:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:42,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:42,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 10:58:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +37: [2023-04-29 10:58:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 10:58:42,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:42,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 10:58:42,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 10:58:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:42,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:42,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 10:58:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:42,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 10:58:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 10:58:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 10:58:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 10:58:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 10:58:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +46: [2023-04-29 10:58:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +51: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +46: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 10:58:42,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 10:58:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 10:58:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 10:58:42,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 10:58:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 10:58:42,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 10:58:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 10:58:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:42,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 10:58:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 10:58:42,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 10:58:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 10:58:42,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 10:58:42,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:42,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 10:58:42,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +63: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 10:58:42,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 10:58:42,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 10:58:42,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 10:58:42,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 10:58:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 10:58:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +63: [2023-04-29 10:58:42,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +63: [2023-04-29 10:58:42,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 10:58:42,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:42,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:42,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:42,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 10:58:42,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 10:58:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:42,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 10:58:42,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 10:58:42,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 10:58:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 10:58:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 10:58:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 10:58:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 10:58:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 1: [2023-04-29 10:58:42,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 1: [2023-04-29 10:58:42,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 1: [2023-04-29 10:58:42,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +59: [2023-04-29 10:58:42,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:42,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 10:58:42,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 10:58:42,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:42,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:42,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 10:58:42,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 10:58:42,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 10:58:42,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 10:58:42,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 1: [2023-04-29 10:58:42,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 10:58:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 10:58:42,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +27: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +27: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +27: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +59: [2023-04-29 10:58:42,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +27: [2023-04-29 10:58:42,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +41: [2023-04-29 10:58:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 10:58:42,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 10:58:42,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 10:58:42,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:42,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 10:58:42,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 10:58:42,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 10:58:42,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 10:58:42,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:42,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:42,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:42,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:42,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:42,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:42,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +56: [2023-04-29 10:58:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +56: [2023-04-29 10:58:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 10:58:42,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 10:58:42,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 10:58:42,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:42,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +27: [2023-04-29 10:58:42,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 10:58:42,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 10:58:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 10:58:42,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:42,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:42,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 10:58:42,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +27: [2023-04-29 10:58:42,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 10:58:42,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:42,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:42,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +29: [2023-04-29 10:58:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 10:58:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 10:58:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 10:58:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +11: [2023-04-29 10:58:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +11: [2023-04-29 10:58:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +11: [2023-04-29 10:58:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +56: [2023-04-29 10:58:42,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +11: [2023-04-29 10:58:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 10:58:42,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 10:58:42,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 10:58:42,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 10:58:42,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +56: [2023-04-29 10:58:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 10:58:42,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +20: [2023-04-29 10:58:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +20: [2023-04-29 10:58:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +20: [2023-04-29 10:58:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +20: [2023-04-29 10:58:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 10:58:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 10:58:42,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 10:58:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 10:58:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +56: [2023-04-29 10:58:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 10:58:42,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 10:58:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +56: [2023-04-29 10:58:42,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +18: [2023-04-29 10:58:42,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 10:58:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 10:58:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 10:58:42,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 10:58:42,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 10:58:42,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +56: [2023-04-29 10:58:42,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 10:58:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:42,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:42,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 10:58:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 10:58:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 10:58:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 10:58:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 10:58:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 10:58:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 10:58:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 10:58:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 10:58:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +28: [2023-04-29 10:58:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +16: [2023-04-29 10:58:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 10:58:42,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 10:58:42,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +28: [2023-04-29 10:58:42,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +45: [2023-04-29 10:58:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +45: [2023-04-29 10:58:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +18: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +16: [2023-04-29 10:58:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 10:58:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 10:58:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 10:58:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 10:58:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 10:58:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 10:58:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 10:58:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 10:58:42,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 10:58:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 10:58:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 10:58:42,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 10:58:42,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 10:58:42,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:42,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:42,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:42,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:42,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:42,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 0: [2023-04-29 10:58:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 0: [2023-04-29 10:58:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 10:58:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 10:58:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 10:58:42,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:42,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:42,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 10:58:42,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 10:58:42,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 10:58:42,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 10:58:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 10:58:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 10:58:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 10:58:42,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 10:58:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 10:58:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 10:58:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 10:58:42,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 10:58:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 10:58:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 10:58:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 10:58:42,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 0: [2023-04-29 10:58:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 10:58:42,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 10:58:42,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 10:58:42,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:42,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 10:58:42,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 10:58:42,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 10:58:42,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 10:58:42,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 10:58:42,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 10:58:42,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 10:58:42,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 10:58:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 10:58:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 10:58:42,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +23: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +23: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 10:58:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 10:58:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 10:58:42,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 10:58:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +45: [2023-04-29 10:58:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 10:58:42,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 10:58:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 10:58:42,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +24: [2023-04-29 10:58:42,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +24: [2023-04-29 10:58:42,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +24: [2023-04-29 10:58:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +31: [2023-04-29 10:58:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +31: [2023-04-29 10:58:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 10:58:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +45: [2023-04-29 10:58:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 10:58:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 10:58:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 10:58:42,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 10:58:42,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:42,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 10:58:42,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 3: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +34: [2023-04-29 10:58:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +13: [2023-04-29 10:58:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +22: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +15: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 10:58:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +34: [2023-04-29 10:58:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +23: [2023-04-29 10:58:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:42,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 10:58:42,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +23: [2023-04-29 10:58:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:42,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 10:58:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +53: [2023-04-29 10:58:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:42,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:42,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +34: [2023-04-29 10:58:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +34: [2023-04-29 10:58:42,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 10:58:42,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 10:58:42,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:42,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:42,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:42,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:42,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:42,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 10:58:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 10:58:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 10:58:42,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 10:58:42,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:42,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:42,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +34: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 10:58:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 10:58:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:42,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:42,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:42,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 10:58:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 10:58:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 10:58:43,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:43,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 10:58:43,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 5: [2023-04-29 10:58:43,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 5: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 5: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 10:58:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +47: [2023-04-29 10:58:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 10:58:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 10:58:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 10:58:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +47: [2023-04-29 10:58:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +47: [2023-04-29 10:58:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... +25: [2023-04-29 10:58:43,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +49: [2023-04-29 10:58:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +53: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +25: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +60: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +50: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +43: [2023-04-29 10:58:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +60: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 10:58:43,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +49: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:43,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +43: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 10:58:43,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:43,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 10:58:43,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 10:58:43,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 10:58:43,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 10:58:43,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 10:58:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 10:58:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 10:58:43,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:43,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +43: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +35: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 10:58:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 10:58:43,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 10:58:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 10:58:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +53: [2023-04-29 10:58:43,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 10:58:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 10:58:43,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:43,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 10:58:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:43,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 10:58:43,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +27: [2023-04-29 10:58:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 10:58:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 10:58:43,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 10:58:43,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:43,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 10:58:43,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 10:58:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +53: [2023-04-29 10:58:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 10:58:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 10:58:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 10:58:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 10:58:43,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 10:58:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 10:58:43,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +58: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 10:58:43,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 10:58:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +18: [2023-04-29 10:58:43,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 10:58:43,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 10:58:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 10:58:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 10:58:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 10:58:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 10:58:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:43,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 10:58:43,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 10:58:43,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:43,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 10:58:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 10:58:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:43,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +42: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +44: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +28: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +49: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +21: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 10:58:43,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +21: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +37: [2023-04-29 10:58:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +28: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 10:58:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +28: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 10:58:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +61: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +52: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +59: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +28: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +41: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +49: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +54: [2023-04-29 10:58:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +10: [2023-04-29 10:58:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +50: [2023-04-29 10:58:43,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +52: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +41: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +10: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +19: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +10: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 4: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +20: [2023-04-29 10:58:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +20: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +52: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +20: [2023-04-29 10:58:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +43: [2023-04-29 10:58:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +47: [2023-04-29 10:58:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +10: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 10:58:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 4: [2023-04-29 10:58:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +10: [2023-04-29 10:58:43,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +32: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +39: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 4: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +35: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +43: [2023-04-29 10:58:43,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +51: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 10:58:43,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 10:58:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 10:58:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +51: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:43,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:43,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 10:58:43,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:43,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 10:58:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +29: [2023-04-29 10:58:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 10:58:43,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 10:58:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +49: [2023-04-29 10:58:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 10:58:43,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 10:58:43,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:43,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +38: [2023-04-29 10:58:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 10:58:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 10:58:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +46: [2023-04-29 10:58:43,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 10:58:43,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 10:58:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +41: [2023-04-29 10:58:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 10:58:43,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 10:58:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +44: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 10:58:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 10:58:43,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 10:58:43,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +37: [2023-04-29 10:58:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 10:58:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +37: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 0: [2023-04-29 10:58:43,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 0: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +41: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +55: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 10:58:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 10:58:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 10:58:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 10:58:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +41: [2023-04-29 10:58:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +19: [2023-04-29 10:58:43,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 10:58:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 10:58:43,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +33: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 10:58:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +54: [2023-04-29 10:58:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 10:58:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 10:58:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +38: [2023-04-29 10:58:43,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 10:58:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 10:58:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +44: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +31: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +61: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +48: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +11: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +56: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +46: [2023-04-29 10:58:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +61: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +33: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 10:58:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 10:58:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 10:58:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +55: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +31: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +29: [2023-04-29 10:58:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +36: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +32: [2023-04-29 10:58:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 7: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +36: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +36: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +20: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 10:58:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +33: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +39: [2023-04-29 10:58:43,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 7: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +51: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +55: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +33: [2023-04-29 10:58:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 10:58:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 10:58:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +29: [2023-04-29 10:58:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 10:58:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 10:58:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 10:58:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 10:58:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 10:58:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 10:58:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 10:58:43,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 10:58:43,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 10:58:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 10:58:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 10:58:43,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +32: [2023-04-29 10:58:43,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +56: [2023-04-29 10:58:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 10:58:43,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 10:58:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 10:58:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 10:58:43,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 10:58:43,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 10:58:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 10:58:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +51: [2023-04-29 10:58:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:43,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +51: [2023-04-29 10:58:43,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +40: [2023-04-29 10:58:43,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +40: [2023-04-29 10:58:43,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 10:58:43,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 10:58:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 10:58:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +14: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 7: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:43,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 10:58:43,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 10:58:43,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +34: [2023-04-29 10:58:43,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 10:58:43,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 10:58:43,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:43,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:43,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 10:58:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 10:58:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 10:58:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 10:58:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 10:58:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +34: [2023-04-29 10:58:43,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 10:58:43,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 10:58:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 10:58:43,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 10:58:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 10:58:43,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +31: [2023-04-29 10:58:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 10:58:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 10:58:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 10:58:43,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 10:58:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 10:58:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +16: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +16: [2023-04-29 10:58:43,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +47: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 10:58:43,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 10:58:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 10:58:43,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:43,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 10:58:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:43,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:43,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 10:58:43,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 10:58:43,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 10:58:43,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 10:58:43,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 10:58:43,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:43,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:43,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:43,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:43,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 10:58:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 10:58:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 10:58:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 10:58:43,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 10:58:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 10:58:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 10:58:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 10:58:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +36: [2023-04-29 10:58:43,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +36: [2023-04-29 10:58:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +36: [2023-04-29 10:58:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +36: [2023-04-29 10:58:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 10:58:43,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 10:58:43,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 10:58:43,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 10:58:43,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 10:58:43,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 10:58:43,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 10:58:43,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 10:58:43,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +26: [2023-04-29 10:58:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 10:58:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 10:58:43,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 10:58:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 10:58:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 10:58:43,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 10:58:43,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt. +57: [2023-04-29 10:58:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 10:58:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 10:58:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 10:58:43,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +63: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +50: [2023-04-29 10:58:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 10:58:43,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 10:58:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 10:58:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 10:58:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:43,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:43,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 10:58:43,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:43,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:43,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:43,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 10:58:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 10:58:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 10:58:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +45: [2023-04-29 10:58:43,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 10:58:43,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:43,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:43,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:43,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +27: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +27: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +27: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +52: [2023-04-29 10:58:43,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +62: [2023-04-29 10:58:43,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +29: [2023-04-29 10:58:43,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 10:58:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 10:58:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 10:58:43,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 10:58:43,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +61: [2023-04-29 10:58:43,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 10:58:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 10:58:43,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 10:58:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +62: [2023-04-29 10:58:43,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +61: [2023-04-29 10:58:43,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +61: [2023-04-29 10:58:43,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +62: [2023-04-29 10:58:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 10:58:43,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +61: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 10:58:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 10:58:43,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +42: [2023-04-29 10:58:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +61: [2023-04-29 10:58:43,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 10:58:43,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 10:58:43,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 10:58:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +45: [2023-04-29 10:58:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 10:58:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 10:58:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +45: [2023-04-29 10:58:43,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +45: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +58: [2023-04-29 10:58:43,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 10:58:43,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 10:58:43,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 10:58:43,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +27: [2023-04-29 10:58:43,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:43,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 10:58:43,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 10:58:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... + 3: [2023-04-29 10:58:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 10:58:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 10:58:43,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +27: [2023-04-29 10:58:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +54: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 10:58:43,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +42: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +18: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +18: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +18: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +42: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +18: [2023-04-29 10:58:43,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +57: [2023-04-29 10:58:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 10:58:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:43,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 10:58:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +53: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:43,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 10:58:43,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +48: [2023-04-29 10:58:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 10:58:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 10:58:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 10:58:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 6: [2023-04-29 10:58:43,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +53: [2023-04-29 10:58:43,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +53: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:43,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 10:58:43,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 10:58:43,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 10:58:43,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 10:58:43,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +45: [2023-04-29 10:58:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 10:58:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:43,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 10:58:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +43: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 1: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 1: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 1: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 1: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +58: [2023-04-29 10:58:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 10:58:43,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 10:58:43,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +45: [2023-04-29 10:58:43,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 10:58:43,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:43,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +41: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 10:58:43,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 10:58:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +17: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +17: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +17: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +58: [2023-04-29 10:58:43,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +17: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 10:58:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +43: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +43: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +43: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +30: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +30: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +30: [2023-04-29 10:58:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +58: [2023-04-29 10:58:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 10:58:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 10:58:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +35: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +22: [2023-04-29 10:58:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 10:58:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +58: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 10:58:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 10:58:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 10:58:43,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:43,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 10:58:43,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:43,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +10: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 10:58:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:43,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:43,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +10: [2023-04-29 10:58:43,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:43,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 10:58:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 10:58:43,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +33: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. + 0: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 0: [2023-04-29 10:58:43,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 0: [2023-04-29 10:58:43,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +41: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 10:58:43,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 10:58:43,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:43,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +20: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +20: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +30: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +43: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +55: [2023-04-29 10:58:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +11: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +11: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +11: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:43,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 10:58:43,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:43,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:43,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:43,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:43,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:43,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 10:58:43,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 10:58:43,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 10:58:43,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 10:58:43,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 10:58:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 10:58:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +54: [2023-04-29 10:58:43,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 10:58:43,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 10:58:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:43,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 10:58:43,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +49: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +54: [2023-04-29 10:58:43,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 10:58:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +45: [2023-04-29 10:58:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 10:58:43,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +11: [2023-04-29 10:58:43,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:43,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +11: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +11: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +20: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +48: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +53: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 10:58:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:43,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +54: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 10:58:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 10:58:43,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:43,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:43,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 10:58:43,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 10:58:43,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +58: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 10:58:43,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 10:58:43,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 10:58:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:43,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 10:58:43,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 10:58:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:43,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:43,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:43,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 10:58:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 10:58:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 10:58:43,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 10:58:43,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +38: [2023-04-29 10:58:43,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 10:58:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 10:58:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 10:58:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 10:58:43,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 10:58:43,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 10:58:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 10:58:43,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:43,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:43,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:43,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +15: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:43,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 10:58:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:43,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +21: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +54: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +19: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +19: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 10:58:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +19: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +43: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 10:58:43,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 10:58:43,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 10:58:43,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 10:58:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +14: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +14: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +14: [2023-04-29 10:58:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +14: [2023-04-29 10:58:43,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 10:58:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +19: [2023-04-29 10:58:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +41: [2023-04-29 10:58:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 10:58:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 10:58:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +15: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +19: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +41: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +53: [2023-04-29 10:58:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +19: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +37: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +37: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +41: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +37: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +15: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +55: [2023-04-29 10:58:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 9: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 9: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. + 9: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +38: [2023-04-29 10:58:43,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +37: [2023-04-29 10:58:43,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. + 7: [2023-04-29 10:58:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 10:58:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +23: [2023-04-29 10:58:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +53: [2023-04-29 10:58:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 10:58:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +23: [2023-04-29 10:58:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +33: [2023-04-29 10:58:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +50: [2023-04-29 10:58:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +50: [2023-04-29 10:58:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 10:58:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 10:58:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 10:58:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:43,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 10:58:43,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:43,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:43,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:43,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 10:58:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 10:58:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +43: [2023-04-29 10:58:43,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 10:58:43,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 10:58:43,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 10:58:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +13: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +13: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +13: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +13: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +43: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:43,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 10:58:43,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +37: [2023-04-29 10:58:43,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:43,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 10:58:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 10:58:43,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 10:58:43,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 10:58:43,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +59: [2023-04-29 10:58:43,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 10:58:43,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 10:58:43,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +20: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +20: [2023-04-29 10:58:43,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 10:58:43,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +48: [2023-04-29 10:58:43,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 10:58:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 10:58:43,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 10:58:43,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 10:58:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +20: [2023-04-29 10:58:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 10:58:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 10:58:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +43: [2023-04-29 10:58:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:43,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 10:58:43,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:43,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 10:58:43,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:43,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 10:58:43,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +39: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +25: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:43,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 10:58:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:43,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 10:58:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +40: [2023-04-29 10:58:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +40: [2023-04-29 10:58:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +13: [2023-04-29 10:58:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 10:58:43,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 10:58:43,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +15: [2023-04-29 10:58:43,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 10:58:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 10:58:43,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:43,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +25: [2023-04-29 10:58:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 10:58:43,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 10:58:43,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:43,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 10:58:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 10:58:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:43,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:43,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 10:58:43,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:43,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:43,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 10:58:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 10:58:43,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 10:58:43,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:43,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +46: [2023-04-29 10:58:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:43,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 10:58:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:43,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 10:58:43,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:43,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 10:58:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 10:58:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:43,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 10:58:43,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:43,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 10:58:43,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 10:58:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 10:58:43,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 10:58:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +21: [2023-04-29 10:58:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +32: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:43,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +59: [2023-04-29 10:58:43,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 10:58:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 10:58:43,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 10:58:43,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 10:58:43,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:43,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 10:58:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +23: [2023-04-29 10:58:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +47: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +59: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:43,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:43,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:43,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:43,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +15: [2023-04-29 10:58:43,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:43,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:43,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 10:58:43,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 10:58:43,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 10:58:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +33: [2023-04-29 10:58:43,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 10:58:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +59: [2023-04-29 10:58:43,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. + 3: [2023-04-29 10:58:43,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. + 3: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +52: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:43,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +23: [2023-04-29 10:58:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:43,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 10:58:43,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:43,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 10:58:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 10:58:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +39: [2023-04-29 10:58:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 10:58:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:43,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 10:58:43,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +37: [2023-04-29 10:58:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 10:58:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:43,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:43,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 10:58:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 10:58:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +40: [2023-04-29 10:58:43,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +21: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +21: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 10:58:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 10:58:43,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:43,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:43,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +21: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:43,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 10:58:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 10:58:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 10:58:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 10:58:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:43,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 10:58:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:43,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +56: [2023-04-29 10:58:43,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +12: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 10:58:43,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +25: [2023-04-29 10:58:43,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:43,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:43,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 10:58:43,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 10:58:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 10:58:43,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:43,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +56: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +56: [2023-04-29 10:58:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 10:58:43,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +32: [2023-04-29 10:58:43,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 10:58:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +25: [2023-04-29 10:58:43,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 10:58:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 10:58:43,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 10:58:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 10:58:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 10:58:43,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 10:58:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 10:58:43,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 10:58:43,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 10:58:43,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:43,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:43,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 10:58:43,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 10:58:43,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 10:58:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 10:58:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 10:58:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 10:58:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +25: [2023-04-29 10:58:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 10:58:43,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +55: [2023-04-29 10:58:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 10:58:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 10:58:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 10:58:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:43,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 10:58:43,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 10:58:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 10:58:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 10:58:43,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:43,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 10:58:43,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 10:58:43,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:43,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 10:58:43,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:43,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:43,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:43,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:43,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 10:58:43,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +59: [2023-04-29 10:58:43,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:43,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 10:58:43,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:43,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +63: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +47: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +21: [2023-04-29 10:58:43,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +47: [2023-04-29 10:58:43,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +47: [2023-04-29 10:58:43,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 10:58:43,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +39: [2023-04-29 10:58:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 10:58:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +63: [2023-04-29 10:58:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +63: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 10:58:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 10:58:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +59: [2023-04-29 10:58:43,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +22: [2023-04-29 10:58:43,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +33: [2023-04-29 10:58:43,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +22: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +22: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +22: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +22: [2023-04-29 10:58:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 10:58:43,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 10:58:43,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 10:58:43,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:43,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:43,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 10:58:43,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 5: [2023-04-29 10:58:43,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +44: [2023-04-29 10:58:43,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 5: [2023-04-29 10:58:43,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +44: [2023-04-29 10:58:43,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:43,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:43,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:43,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 10:58:43,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 10:58:43,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:43,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:43,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:43,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:43,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:43,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 10:58:43,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:43,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 10:58:43,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 10:58:43,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +47: [2023-04-29 10:58:43,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 10:58:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +34: [2023-04-29 10:58:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +27: [2023-04-29 10:58:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:43,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +34: [2023-04-29 10:58:43,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:43,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 10:58:43,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +18: [2023-04-29 10:58:43,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 10:58:43,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 10:58:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 10:58:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +18: [2023-04-29 10:58:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +34: [2023-04-29 10:58:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt... +18: [2023-04-29 10:58:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 10:58:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +18: [2023-04-29 10:58:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +51: [2023-04-29 10:58:43,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:43,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +63: [2023-04-29 10:58:43,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:43,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +63: [2023-04-29 10:58:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 10:58:43,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 10:58:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 10:58:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 10:58:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:43,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 10:58:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 10:58:44,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +16: [2023-04-29 10:58:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +16: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +22: [2023-04-29 10:58:44,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +25: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +25: [2023-04-29 10:58:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +47: [2023-04-29 10:58:44,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +25: [2023-04-29 10:58:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:44,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:44,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 10:58:44,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:44,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:44,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:44,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:44,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:44,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 10:58:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:44,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:44,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 10:58:44,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 10:58:44,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 10:58:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:44,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +26: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 10:58:44,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 10:58:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 10:58:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 10:58:44,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 10:58:44,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 10:58:44,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 10:58:44,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 10:58:44,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +24: [2023-04-29 10:58:44,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 10:58:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:44,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:44,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:44,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 10:58:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 10:58:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 10:58:44,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 10:58:44,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +36: [2023-04-29 10:58:44,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:44,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +24: [2023-04-29 10:58:44,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:44,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 10:58:44,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 10:58:44,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:44,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 10:58:44,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 10:58:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:44,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:44,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 10:58:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +25: [2023-04-29 10:58:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +25: [2023-04-29 10:58:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +62: [2023-04-29 10:58:44,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +28: [2023-04-29 10:58:44,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 10:58:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 10:58:44,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 10:58:44,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:44,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:44,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +17: [2023-04-29 10:58:44,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +17: [2023-04-29 10:58:44,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +36: [2023-04-29 10:58:44,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +17: [2023-04-29 10:58:44,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +62: [2023-04-29 10:58:44,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:44,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 10:58:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 10:58:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:44,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 10:58:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 10:58:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 10:58:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 10:58:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 10:58:44,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 10:58:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +36: [2023-04-29 10:58:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +28: [2023-04-29 10:58:44,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +50: [2023-04-29 10:58:44,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:44,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 10:58:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 10:58:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 10:58:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 10:58:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. + 6: [2023-04-29 10:58:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 6: [2023-04-29 10:58:44,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +42: [2023-04-29 10:58:44,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +42: [2023-04-29 10:58:44,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 6: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 10:58:44,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 10:58:44,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 10:58:44,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 10:58:44,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 10:58:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:44,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 10:58:44,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 10:58:44,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +29: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 10:58:44,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +52: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +52: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:44,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:44,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 10:58:44,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +17: [2023-04-29 10:58:44,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 10:58:44,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +31: [2023-04-29 10:58:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:44,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +31: [2023-04-29 10:58:44,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +30: [2023-04-29 10:58:44,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:44,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +30: [2023-04-29 10:58:44,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +62: [2023-04-29 10:58:44,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +31: [2023-04-29 10:58:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +31: [2023-04-29 10:58:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:44,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +31: [2023-04-29 10:58:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 10:58:44,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:44,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +30: [2023-04-29 10:58:44,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:44,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +30: [2023-04-29 10:58:44,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 10:58:44,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 10:58:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 10:58:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 10:58:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 10:58:44,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 10:58:44,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +63: [2023-04-29 10:58:44,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 10:58:44,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 10:58:44,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 10:58:44,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +10: [2023-04-29 10:58:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 10:58:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 10:58:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 10:58:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +62: [2023-04-29 10:58:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 7: [2023-04-29 10:58:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +17: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:44,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:44,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +10: [2023-04-29 10:58:44,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 10:58:44,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 10:58:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +50: [2023-04-29 10:58:44,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 6: [2023-04-29 10:58:44,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 10:58:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 6: [2023-04-29 10:58:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +50: [2023-04-29 10:58:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 6: [2023-04-29 10:58:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +46: [2023-04-29 10:58:44,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:44,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:44,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:44,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:44,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:44,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 10:58:44,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 10:58:44,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 10:58:44,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 10:58:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 10:58:44,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:44,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 10:58:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 10:58:44,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 10:58:44,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:44,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 4: [2023-04-29 10:58:44,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:44,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:44,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +29: [2023-04-29 10:58:44,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 10:58:44,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:44,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:44,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +31: [2023-04-29 10:58:44,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 10:58:44,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:44,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:44,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:44,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 10:58:44,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 10:58:44,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:44,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 10:58:44,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 10:58:44,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 10:58:44,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 10:58:44,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 10:58:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +52: [2023-04-29 10:58:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 10:58:44,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +31: [2023-04-29 10:58:44,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:44,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +31: [2023-04-29 10:58:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 10:58:44,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 10:58:44,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 10:58:44,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 10:58:44,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 10:58:44,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:44,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 10:58:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 10:58:44,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 10:58:44,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:44,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:44,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:44,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 10:58:44,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:44,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:44,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:44,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 10:58:44,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:44,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 10:58:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 10:58:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 10:58:44,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 10:58:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +46: [2023-04-29 10:58:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:44,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +31: [2023-04-29 10:58:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 10:58:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 10:58:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +31: [2023-04-29 10:58:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:44,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:44,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +30: [2023-04-29 10:58:44,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:44,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 10:58:44,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 7: [2023-04-29 10:58:44,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 7: [2023-04-29 10:58:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +43: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 10:58:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +63: [2023-04-29 10:58:44,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +63: [2023-04-29 10:58:44,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +10: [2023-04-29 10:58:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:44,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +44: [2023-04-29 10:58:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +44: [2023-04-29 10:58:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +10: [2023-04-29 10:58:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +10: [2023-04-29 10:58:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 10:58:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +43: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 10:58:44,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:44,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:44,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 10:58:44,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 10:58:44,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +48: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +44: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +55: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +55: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. + 9: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:44,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 10:58:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 10:58:44,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 10:58:44,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 10:58:44,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 10:58:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 10:58:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 10:58:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 10:58:44,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 10:58:44,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:44,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 10:58:44,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 10:58:44,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:44,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:44,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 10:58:44,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +62: [2023-04-29 10:58:44,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 10:58:44,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 10:58:44,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 10:58:44,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +11: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +11: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 10:58:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +11: [2023-04-29 10:58:44,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:44,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:44,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:44,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:44,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:44,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:44,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 10:58:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 10:58:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 10:58:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 10:58:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 10:58:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:44,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 10:58:44,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 10:58:44,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 10:58:44,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 10:58:44,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:44,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:44,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 10:58:44,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +57: [2023-04-29 10:58:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +57: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:44,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:44,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:44,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +33: [2023-04-29 10:58:44,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +33: [2023-04-29 10:58:44,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +33: [2023-04-29 10:58:44,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:44,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:44,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +38: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +38: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 10:58:44,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 10:58:44,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 10:58:44,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:44,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:44,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 10:58:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +49: [2023-04-29 10:58:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +49: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. + 2: [2023-04-29 10:58:44,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +49: [2023-04-29 10:58:44,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 10:58:44,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:44,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. + 2: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +42: [2023-04-29 10:58:44,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +56: [2023-04-29 10:58:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +56: [2023-04-29 10:58:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +56: [2023-04-29 10:58:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 10:58:44,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 10:58:44,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 10:58:44,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 10:58:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 10:58:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 10:58:44,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 10:58:44,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 10:58:44,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +43: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 10:58:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 10:58:44,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:44,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 10:58:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +44: [2023-04-29 10:58:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +44: [2023-04-29 10:58:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 9: [2023-04-29 10:58:44,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:44,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:44,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +12: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +35: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +11: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 10:58:44,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. + 9: [2023-04-29 10:58:44,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 10:58:44,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:44,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:44,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 10:58:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +41: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 10:58:44,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 10:58:44,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:44,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:44,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 10:58:44,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +58: [2023-04-29 10:58:44,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 10:58:44,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 10:58:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 10:58:44,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:44,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 10:58:44,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 10:58:44,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 10:58:44,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 10:58:44,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +55: [2023-04-29 10:58:44,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +61: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +11: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 10:58:44,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 10:58:44,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +55: [2023-04-29 10:58:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... + 0: [2023-04-29 10:58:44,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 10:58:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 10:58:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 10:58:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 10:58:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 10:58:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 10:58:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 10:58:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 10:58:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 10:58:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 10:58:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +62: [2023-04-29 10:58:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 10:58:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 10:58:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:44,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +43: [2023-04-29 10:58:44,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:44,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 10:58:44,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +53: [2023-04-29 10:58:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +53: [2023-04-29 10:58:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +53: [2023-04-29 10:58:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 10:58:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:44,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 10:58:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 10:58:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:44,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 10:58:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:44,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 10:58:44,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 10:58:44,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:44,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +12: [2023-04-29 10:58:44,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +35: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +32: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 10:58:44,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +49: [2023-04-29 10:58:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 10:58:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 10:58:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:44,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 10:58:44,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 10:58:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +33: [2023-04-29 10:58:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 10:58:44,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 10:58:44,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 10:58:44,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 10:58:44,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +33: [2023-04-29 10:58:44,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +58: [2023-04-29 10:58:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 10:58:44,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 10:58:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +58: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +57: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +57: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 10:58:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 10:58:44,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 10:58:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 10:58:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +58: [2023-04-29 10:58:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +50: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +50: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 10:58:44,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 10:58:44,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +49: [2023-04-29 10:58:44,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 10:58:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 10:58:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +56: [2023-04-29 10:58:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +56: [2023-04-29 10:58:44,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 10:58:44,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +41: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +56: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 10:58:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 10:58:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 10:58:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 10:58:44,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +32: [2023-04-29 10:58:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 10:58:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 10:58:44,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 10:58:44,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 10:58:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 10:58:44,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +16: [2023-04-29 10:58:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 10:58:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 10:58:44,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 10:58:44,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +16: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +22: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:44,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +22: [2023-04-29 10:58:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 10:58:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +16: [2023-04-29 10:58:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +16: [2023-04-29 10:58:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +50: [2023-04-29 10:58:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 10:58:44,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:44,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 10:58:44,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:44,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 10:58:44,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 10:58:44,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +39: [2023-04-29 10:58:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 10:58:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 10:58:44,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 10:58:44,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 10:58:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +39: [2023-04-29 10:58:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 10:58:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 10:58:44,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 10:58:44,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +35: [2023-04-29 10:58:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:44,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 10:58:44,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 10:58:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +60: [2023-04-29 10:58:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 10:58:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 10:58:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 10:58:44,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 10:58:44,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 10:58:44,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 10:58:44,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 10:58:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 10:58:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 10:58:44,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:44,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:44,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:44,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 10:58:44,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:44,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +52: [2023-04-29 10:58:44,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 10:58:44,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +40: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +40: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +40: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 10:58:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 10:58:44,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +14: [2023-04-29 10:58:44,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 10:58:44,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:44,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:44,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:44,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +21: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 10:58:44,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +21: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 10:58:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:44,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:44,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 10:58:44,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +34: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 10:58:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 10:58:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 10:58:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 10:58:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 10:58:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +60: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 10:58:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +47: [2023-04-29 10:58:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +21: [2023-04-29 10:58:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 10:58:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +32: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 10:58:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +22: [2023-04-29 10:58:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 10:58:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 10:58:44,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 10:58:44,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 10:58:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 10:58:44,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +22: [2023-04-29 10:58:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 10:58:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 10:58:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 10:58:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:44,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:44,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:44,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 10:58:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 10:58:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 10:58:44,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:44,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 10:58:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:44,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:44,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 10:58:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 10:58:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +18: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 10:58:44,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 10:58:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 10:58:44,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:44,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 10:58:44,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 10:58:44,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +16: [2023-04-29 10:58:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 10:58:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 10:58:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:44,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 10:58:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 10:58:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:44,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:44,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 10:58:44,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 10:58:44,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 10:58:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 10:58:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 10:58:44,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt. +19: [2023-04-29 10:58:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 10:58:44,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 10:58:44,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:44,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 10:58:44,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 10:58:44,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:44,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 10:58:44,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 10:58:44,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:44,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 10:58:44,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +54: [2023-04-29 10:58:44,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 10:58:44,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 10:58:44,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 10:58:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:44,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 10:58:44,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 10:58:44,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 10:58:44,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 10:58:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +14: [2023-04-29 10:58:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 10:58:44,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:44,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 10:58:44,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 10:58:44,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 10:58:44,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +42: [2023-04-29 10:58:44,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +21: [2023-04-29 10:58:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 10:58:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +15: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +34: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +15: [2023-04-29 10:58:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 10:58:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 10:58:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 10:58:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 10:58:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +21: [2023-04-29 10:58:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 10:58:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +21: [2023-04-29 10:58:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 10:58:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 10:58:44,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 10:58:44,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 10:58:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 10:58:44,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 10:58:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 10:58:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 10:58:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 10:58:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 10:58:44,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 10:58:44,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:44,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 10:58:44,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 10:58:44,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:44,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 10:58:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 10:58:44,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:44,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 10:58:44,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +60: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +60: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +18: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +18: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:44,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:44,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +14: [2023-04-29 10:58:44,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 10:58:44,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:44,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 10:58:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +63: [2023-04-29 10:58:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:44,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 10:58:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +47: [2023-04-29 10:58:44,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 10:58:44,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +25: [2023-04-29 10:58:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:44,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:44,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:44,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +63: [2023-04-29 10:58:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 10:58:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 10:58:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 10:58:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:44,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 10:58:44,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:44,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:44,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 10:58:44,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +19: [2023-04-29 10:58:44,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:44,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:44,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +45: [2023-04-29 10:58:44,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 10:58:44,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:44,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:44,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 10:58:44,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 10:58:44,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:44,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 10:58:44,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 10:58:44,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:44,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 10:58:44,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:44,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +13: [2023-04-29 10:58:44,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 10:58:44,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +54: [2023-04-29 10:58:44,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +54: [2023-04-29 10:58:44,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 10:58:44,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:44,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 10:58:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +51: [2023-04-29 10:58:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +19: [2023-04-29 10:58:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:44,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:44,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 10:58:44,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +51: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +23: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +23: [2023-04-29 10:58:44,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:44,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:44,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 10:58:44,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +26: [2023-04-29 10:58:44,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +51: [2023-04-29 10:58:44,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 10:58:44,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +51: [2023-04-29 10:58:44,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +51: [2023-04-29 10:58:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt. +26: [2023-04-29 10:58:44,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:44,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:44,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 10:58:44,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:44,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 10:58:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:44,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt... +15: [2023-04-29 10:58:44,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 10:58:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt... +24: [2023-04-29 10:58:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +24: [2023-04-29 10:58:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:44,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +25: [2023-04-29 10:58:44,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 10:58:44,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +15: [2023-04-29 10:58:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 10:58:44,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:44,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +60: [2023-04-29 10:58:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:44,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:44,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +60: [2023-04-29 10:58:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 10:58:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:44,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:44,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 10:58:44,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 10:58:44,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:44,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:44,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:44,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:44,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 10:58:44,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 10:58:44,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 10:58:44,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 10:58:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 10:58:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 10:58:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:44,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:44,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 10:58:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:44,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:44,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 10:58:44,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 10:58:44,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +63: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +63: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:44,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +26: [2023-04-29 10:58:44,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +48: [2023-04-29 10:58:44,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:44,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:44,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 10:58:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +26: [2023-04-29 10:58:44,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 10:58:44,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 10:58:44,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:44,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 10:58:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 10:58:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 10:58:44,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +43: [2023-04-29 10:58:44,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 10:58:44,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:44,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:44,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 10:58:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:44,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:44,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:44,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:44,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 10:58:44,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:44,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:44,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:44,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:44,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:44,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 10:58:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 10:58:44,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 10:58:44,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 10:58:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:44,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 10:58:44,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +45: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +45: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +45: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +24: [2023-04-29 10:58:44,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:44,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +55: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 1: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +52: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +28: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +58: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:44,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +55: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:44,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:44,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:44,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +58: [2023-04-29 10:58:44,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:44,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +44: [2023-04-29 10:58:44,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 10:58:44,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 10:58:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 10:58:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 10:58:44,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:44,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:44,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:44,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +24: [2023-04-29 10:58:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 10:58:44,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 5: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +32: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +49: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 10:58:44,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 10:58:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 10:58:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 10:58:44,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 10:58:44,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:44,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 10:58:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:44,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +23: [2023-04-29 10:58:44,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 10:58:44,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +54: [2023-04-29 10:58:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 10:58:44,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 10:58:44,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +45: [2023-04-29 10:58:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 10:58:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:44,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:44,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:44,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:44,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 10:58:44,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:44,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 10:58:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 10:58:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +15: [2023-04-29 10:58:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 10:58:44,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 10:58:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:44,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 10:58:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 10:58:44,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 5: [2023-04-29 10:58:44,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +22: [2023-04-29 10:58:44,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +22: [2023-04-29 10:58:44,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +63: [2023-04-29 10:58:44,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:44,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:44,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:44,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:44,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:44,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:44,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:44,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 10:58:44,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 10:58:44,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 10:58:44,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 10:58:44,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 10:58:44,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:44,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 10:58:44,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:44,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:44,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:44,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 10:58:44,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:44,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 10:58:44,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:44,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:44,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:44,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:44,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 10:58:44,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 10:58:44,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:44,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:44,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:44,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:44,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 10:58:44,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +52: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 10:58:44,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:44,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 10:58:44,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 10:58:44,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 10:58:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 10:58:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +10: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +50: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +10: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +43: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +50: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +22: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +50: [2023-04-29 10:58:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 8: [2023-04-29 10:58:44,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 10:58:44,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 10:58:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +58: [2023-04-29 10:58:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 10:58:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 10:58:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +52: [2023-04-29 10:58:44,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 10:58:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:44,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +45: [2023-04-29 10:58:44,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +20: [2023-04-29 10:58:44,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +48: [2023-04-29 10:58:44,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:44,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 10:58:44,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +44: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 10:58:44,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +43: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 10:58:44,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +11: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 10:58:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 10:58:44,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:44,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 10:58:44,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +31: [2023-04-29 10:58:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:44,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +57: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 3: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +11: [2023-04-29 10:58:44,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +35: [2023-04-29 10:58:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 10:58:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 10:58:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 10:58:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:44,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 10:58:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +43: [2023-04-29 10:58:44,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 10:58:44,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 10:58:44,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 10:58:44,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +28: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +59: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +10: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +29: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +35: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 10:58:44,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 10:58:44,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 5: [2023-04-29 10:58:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +59: [2023-04-29 10:58:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 10:58:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 10:58:44,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 10:58:44,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:44,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +29: [2023-04-29 10:58:44,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 10:58:44,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:44,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +18: [2023-04-29 10:58:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +18: [2023-04-29 10:58:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +18: [2023-04-29 10:58:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 10:58:44,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 10:58:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 10:58:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 10:58:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +49: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +17: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 10:58:44,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:44,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:44,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:44,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 10:58:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 10:58:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 10:58:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +32: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 5: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +32: [2023-04-29 10:58:44,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:44,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:44,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:44,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 10:58:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:44,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 1: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 1: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 10:58:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:44,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:44,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:44,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 10:58:44,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +23: [2023-04-29 10:58:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 10:58:45,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +23: [2023-04-29 10:58:45,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 10:58:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 6: [2023-04-29 10:58:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +54: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 10:58:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +59: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +59: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +59: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 10:58:45,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 10:58:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +18: [2023-04-29 10:58:45,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:45,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:45,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 10:58:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +22: [2023-04-29 10:58:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 10:58:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 10:58:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:45,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:45,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 10:58:45,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 10:58:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +22: [2023-04-29 10:58:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +44: [2023-04-29 10:58:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:45,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +31: [2023-04-29 10:58:45,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 10:58:45,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 10:58:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 10:58:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:45,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +44: [2023-04-29 10:58:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:45,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:45,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:45,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 10:58:45,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 10:58:45,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:45,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +22: [2023-04-29 10:58:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 10:58:45,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 10:58:45,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +38: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 10:58:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:45,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 10:58:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:45,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 10:58:45,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:45,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 10:58:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 10:58:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 10:58:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +48: [2023-04-29 10:58:45,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:45,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +42: [2023-04-29 10:58:45,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 10:58:45,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:45,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:45,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 10:58:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 10:58:45,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:45,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +11: [2023-04-29 10:58:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:45,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +31: [2023-04-29 10:58:45,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:45,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +27: [2023-04-29 10:58:45,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 10:58:45,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 10:58:45,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +55: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +55: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +31: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 10:58:45,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 10:58:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +27: [2023-04-29 10:58:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 10:58:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +27: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +29: [2023-04-29 10:58:45,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:45,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 10:58:45,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 10:58:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 10:58:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 10:58:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +29: [2023-04-29 10:58:45,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 10:58:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +24: [2023-04-29 10:58:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +18: [2023-04-29 10:58:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +29: [2023-04-29 10:58:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:45,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 10:58:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +24: [2023-04-29 10:58:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +18: [2023-04-29 10:58:45,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:45,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 10:58:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 10:58:45,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 10:58:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 10:58:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 10:58:45,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 10:58:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 10:58:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 10:58:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 10:58:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 10:58:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +29: [2023-04-29 10:58:45,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 10:58:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 10:58:45,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 10:58:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +55: [2023-04-29 10:58:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +34: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 10:58:45,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 10:58:45,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:45,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 10:58:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:45,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:45,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 10:58:45,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 10:58:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +18: [2023-04-29 10:58:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +55: [2023-04-29 10:58:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +55: [2023-04-29 10:58:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +55: [2023-04-29 10:58:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 10:58:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 10:58:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 10:58:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +29: [2023-04-29 10:58:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 10:58:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 10:58:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 10:58:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 10:58:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 10:58:45,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 10:58:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 10:58:45,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +31: [2023-04-29 10:58:45,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:45,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 10:58:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 10:58:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 10:58:45,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 10:58:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +38: [2023-04-29 10:58:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 10:58:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +38: [2023-04-29 10:58:45,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +38: [2023-04-29 10:58:45,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 10:58:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 10:58:45,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +38: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +34: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +25: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 10:58:45,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 10:58:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +38: [2023-04-29 10:58:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +16: [2023-04-29 10:58:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +16: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 10:58:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 10:58:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 10:58:45,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +27: [2023-04-29 10:58:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 10:58:45,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:45,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 10:58:45,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 10:58:45,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 10:58:45,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:45,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 10:58:45,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 10:58:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 10:58:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 10:58:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 10:58:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +29: [2023-04-29 10:58:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 10:58:45,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:45,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 10:58:45,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 10:58:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 10:58:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 10:58:45,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 10:58:45,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 10:58:45,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 10:58:45,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +32: [2023-04-29 10:58:45,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:45,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:45,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:45,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:45,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 10:58:45,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 10:58:45,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 10:58:45,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 10:58:45,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +29: [2023-04-29 10:58:45,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +17: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 10:58:45,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 10:58:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 10:58:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:45,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +55: [2023-04-29 10:58:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +25: [2023-04-29 10:58:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 10:58:45,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 10:58:45,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 10:58:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 10:58:45,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 10:58:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 10:58:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 10:58:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 10:58:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +34: [2023-04-29 10:58:45,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 10:58:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:45,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +19: [2023-04-29 10:58:45,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +37: [2023-04-29 10:58:45,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 10:58:45,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +19: [2023-04-29 10:58:45,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +56: [2023-04-29 10:58:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +27: [2023-04-29 10:58:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 10:58:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +27: [2023-04-29 10:58:45,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 10:58:45,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +27: [2023-04-29 10:58:45,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 10:58:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +27: [2023-04-29 10:58:45,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 10:58:45,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 10:58:45,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:45,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:45,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 10:58:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 10:58:45,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +35: [2023-04-29 10:58:45,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +37: [2023-04-29 10:58:45,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 10:58:45,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +55: [2023-04-29 10:58:45,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 10:58:45,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +39: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 6: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +55: [2023-04-29 10:58:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +29: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 0: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:45,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:45,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 10:58:45,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +44: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +56: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +14: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 10:58:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 10:58:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 10:58:45,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 10:58:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 10:58:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 10:58:45,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:45,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 10:58:45,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +44: [2023-04-29 10:58:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 10:58:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:45,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 10:58:45,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:45,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +55: [2023-04-29 10:58:45,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 10:58:45,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +63: [2023-04-29 10:58:45,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:45,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:45,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 10:58:45,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 10:58:45,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +10: [2023-04-29 10:58:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +51: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +51: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +51: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 10:58:45,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +58: [2023-04-29 10:58:45,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +10: [2023-04-29 10:58:45,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +58: [2023-04-29 10:58:45,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 10:58:45,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +10: [2023-04-29 10:58:45,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +10: [2023-04-29 10:58:45,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +58: [2023-04-29 10:58:45,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +13: [2023-04-29 10:58:45,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 10:58:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 0: [2023-04-29 10:58:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 10:58:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +13: [2023-04-29 10:58:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 10:58:45,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 10:58:45,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +25: [2023-04-29 10:58:45,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 10:58:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 10:58:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 10:58:45,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +30: [2023-04-29 10:58:45,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:45,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:45,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +56: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 10:58:45,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +25: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 10:58:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 10:58:45,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 10:58:45,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:45,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 10:58:45,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 10:58:45,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +34: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +63: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 10:58:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 10:58:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +16: [2023-04-29 10:58:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +55: [2023-04-29 10:58:45,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +56: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +53: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 10:58:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +60: [2023-04-29 10:58:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 10:58:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:45,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +21: [2023-04-29 10:58:45,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:45,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +46: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +21: [2023-04-29 10:58:45,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 10:58:45,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +37: [2023-04-29 10:58:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +51: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +54: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 10:58:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +21: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +40: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +30: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +30: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 10:58:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +40: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 10:58:45,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +54: [2023-04-29 10:58:45,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 10:58:45,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 10:58:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:45,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 10:58:45,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 10:58:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 10:58:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +19: [2023-04-29 10:58:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +28: [2023-04-29 10:58:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 10:58:45,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +30: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +54: [2023-04-29 10:58:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +54: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +36: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +14: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +48: [2023-04-29 10:58:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:45,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +28: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +56: [2023-04-29 10:58:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +19: [2023-04-29 10:58:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +30: [2023-04-29 10:58:45,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +19: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +52: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 10:58:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 10:58:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +47: [2023-04-29 10:58:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +19: [2023-04-29 10:58:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +12: [2023-04-29 10:58:45,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 10:58:45,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 10:58:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 10:58:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +33: [2023-04-29 10:58:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +30: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +37: [2023-04-29 10:58:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +19: [2023-04-29 10:58:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +56: [2023-04-29 10:58:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +19: [2023-04-29 10:58:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +37: [2023-04-29 10:58:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 10:58:45,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 10:58:45,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 10:58:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 10:58:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 10:58:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 10:58:45,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:45,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:45,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:45,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 10:58:45,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +56: [2023-04-29 10:58:45,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 10:58:45,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 10:58:45,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:45,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:45,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 10:58:45,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:45,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:45,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 10:58:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 10:58:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 10:58:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 10:58:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 10:58:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +56: [2023-04-29 10:58:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 10:58:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 10:58:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 10:58:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 10:58:45,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 10:58:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 10:58:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 10:58:45,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 10:58:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:45,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 10:58:45,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 10:58:45,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 10:58:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:45,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:45,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 10:58:45,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 10:58:45,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:45,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 10:58:45,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:45,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 10:58:45,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:45,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 10:58:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:45,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 10:58:45,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +56: [2023-04-29 10:58:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +63: [2023-04-29 10:58:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:45,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 10:58:45,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:45,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +58: [2023-04-29 10:58:45,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +58: [2023-04-29 10:58:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +30: [2023-04-29 10:58:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 10:58:45,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 0: [2023-04-29 10:58:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 10:58:45,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. + 0: [2023-04-29 10:58:45,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 10:58:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 10:58:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 10:58:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 10:58:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 10:58:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 10:58:45,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +63: [2023-04-29 10:58:45,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 10:58:45,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 10:58:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +63: [2023-04-29 10:58:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 10:58:45,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 10:58:45,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 10:58:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 10:58:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 10:58:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 10:58:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 10:58:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 10:58:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 10:58:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +30: [2023-04-29 10:58:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 10:58:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 10:58:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:45,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 10:58:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:45,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 10:58:45,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 10:58:45,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 10:58:45,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:45,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:45,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:45,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:45,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:45,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +11: [2023-04-29 10:58:45,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 10:58:45,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 10:58:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 10:58:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 10:58:45,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 10:58:45,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 10:58:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 10:58:45,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 10:58:45,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... + 4: [2023-04-29 10:58:45,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +59: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 10:58:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 10:58:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 10:58:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 10:58:45,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +34: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +50: [2023-04-29 10:58:45,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 10:58:45,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 10:58:45,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:45,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +62: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:45,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +42: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +53: [2023-04-29 10:58:45,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:45,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:45,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +43: [2023-04-29 10:58:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +43: [2023-04-29 10:58:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 10:58:45,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +43: [2023-04-29 10:58:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 10:58:45,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 10:58:45,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 10:58:45,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:45,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +50: [2023-04-29 10:58:45,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:45,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 10:58:45,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 10:58:45,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 10:58:45,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 10:58:45,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 10:58:45,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +16: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +16: [2023-04-29 10:58:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +45: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +45: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +16: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +61: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +14: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +14: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 10:58:45,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt... +43: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 10:58:45,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 10:58:45,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 10:58:45,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 10:58:45,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +36: [2023-04-29 10:58:45,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 10:58:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 4: [2023-04-29 10:58:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 10:58:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 10:58:45,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 0: [2023-04-29 10:58:45,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 10:58:45,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:45,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 10:58:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 10:58:45,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +40: [2023-04-29 10:58:45,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 10:58:45,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 10:58:45,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +45: [2023-04-29 10:58:45,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 10:58:45,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +15: [2023-04-29 10:58:45,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 10:58:45,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 10:58:45,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 10:58:45,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 10:58:45,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:45,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 10:58:45,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 10:58:45,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +11: [2023-04-29 10:58:45,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 10:58:45,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 10:58:45,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 10:58:45,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +42: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 10:58:45,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 10:58:45,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 10:58:45,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 10:58:45,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +62: [2023-04-29 10:58:45,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 10:58:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:45,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 10:58:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 10:58:45,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +51: [2023-04-29 10:58:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +42: [2023-04-29 10:58:45,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 10:58:45,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 10:58:45,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +40: [2023-04-29 10:58:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:45,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 10:58:45,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 10:58:45,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 10:58:45,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 10:58:45,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 10:58:45,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 10:58:45,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 10:58:45,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +22: [2023-04-29 10:58:45,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +50: [2023-04-29 10:58:45,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 10:58:45,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 10:58:45,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +51: [2023-04-29 10:58:45,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 10:58:45,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +50: [2023-04-29 10:58:45,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 10:58:45,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 10:58:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 10:58:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 10:58:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +14: [2023-04-29 10:58:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +61: [2023-04-29 10:58:45,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +50: [2023-04-29 10:58:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +50: [2023-04-29 10:58:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 10:58:45,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 10:58:45,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 10:58:45,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:45,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 10:58:45,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +14: [2023-04-29 10:58:45,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +61: [2023-04-29 10:58:45,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 10:58:45,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 10:58:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +26: [2023-04-29 10:58:45,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +26: [2023-04-29 10:58:45,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +26: [2023-04-29 10:58:45,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +43: [2023-04-29 10:58:45,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 10:58:45,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 10:58:45,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 10:58:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:45,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:45,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 10:58:45,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 10:58:45,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 10:58:45,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 10:58:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:45,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:45,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 10:58:45,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 10:58:45,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:45,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 10:58:45,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:45,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 10:58:45,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 10:58:45,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 10:58:45,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:45,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 10:58:45,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +12: [2023-04-29 10:58:45,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 10:58:45,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 10:58:45,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +12: [2023-04-29 10:58:45,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 10:58:45,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +26: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 10:58:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 10:58:45,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 10:58:45,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 10:58:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 10:58:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 10:58:45,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:45,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 10:58:45,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 10:58:45,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +47: [2023-04-29 10:58:45,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:45,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 10:58:45,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 10:58:45,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:45,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 10:58:45,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +12: [2023-04-29 10:58:45,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +47: [2023-04-29 10:58:45,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:45,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:45,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:45,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 10:58:45,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 10:58:45,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 10:58:45,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 10:58:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +15: [2023-04-29 10:58:45,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 5: [2023-04-29 10:58:45,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 5: [2023-04-29 10:58:45,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 5: [2023-04-29 10:58:45,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 10:58:45,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:45,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:45,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +13: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +44: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +13: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 10:58:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 10:58:45,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt. +19: [2023-04-29 10:58:45,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:45,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:45,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 10:58:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 10:58:45,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 10:58:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 10:58:45,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:45,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:45,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 10:58:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:45,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 10:58:45,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 10:58:45,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 10:58:45,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:45,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 10:58:45,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:45,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:45,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 10:58:45,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 10:58:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 10:58:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +26: [2023-04-29 10:58:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 10:58:45,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 10:58:45,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 10:58:45,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +26: [2023-04-29 10:58:45,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 10:58:45,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 10:58:45,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 10:58:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:45,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 10:58:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 10:58:45,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 10:58:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 10:58:45,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 10:58:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:45,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +48: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 10:58:45,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +21: [2023-04-29 10:58:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 10:58:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +21: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +21: [2023-04-29 10:58:45,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 10:58:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +26: [2023-04-29 10:58:45,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 10:58:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 10:58:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +26: [2023-04-29 10:58:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +52: [2023-04-29 10:58:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +52: [2023-04-29 10:58:45,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 10:58:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 10:58:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 10:58:45,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +52: [2023-04-29 10:58:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +26: [2023-04-29 10:58:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +52: [2023-04-29 10:58:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 10:58:45,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +26: [2023-04-29 10:58:45,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 10:58:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 10:58:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 10:58:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 10:58:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +47: [2023-04-29 10:58:45,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 10:58:45,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +48: [2023-04-29 10:58:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 10:58:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 10:58:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 10:58:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +48: [2023-04-29 10:58:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 10:58:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 10:58:45,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 10:58:45,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 10:58:45,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 10:58:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:45,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +55: [2023-04-29 10:58:45,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +55: [2023-04-29 10:58:45,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +55: [2023-04-29 10:58:45,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 10:58:45,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 10:58:45,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +19: [2023-04-29 10:58:45,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 10:58:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 10:58:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 10:58:45,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 10:58:45,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 10:58:45,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 10:58:45,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 10:58:45,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 10:58:45,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 10:58:45,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +15: [2023-04-29 10:58:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 10:58:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 10:58:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 10:58:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +44: [2023-04-29 10:58:45,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +26: [2023-04-29 10:58:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +54: [2023-04-29 10:58:45,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 10:58:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 10:58:45,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 10:58:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +13: [2023-04-29 10:58:45,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +13: [2023-04-29 10:58:45,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +26: [2023-04-29 10:58:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 10:58:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt... +19: [2023-04-29 10:58:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:45,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 10:58:45,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +19: [2023-04-29 10:58:45,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 10:58:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 10:58:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 10:58:45,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +44: [2023-04-29 10:58:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 10:58:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +19: [2023-04-29 10:58:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 10:58:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +15: [2023-04-29 10:58:45,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 10:58:45,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:45,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:45,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +21: [2023-04-29 10:58:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:45,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 10:58:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 10:58:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 10:58:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 10:58:45,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 10:58:45,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +21: [2023-04-29 10:58:45,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 10:58:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 10:58:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 10:58:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:45,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:45,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +26: [2023-04-29 10:58:45,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 10:58:45,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +48: [2023-04-29 10:58:45,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 3: [2023-04-29 10:58:45,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +35: [2023-04-29 10:58:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +35: [2023-04-29 10:58:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +35: [2023-04-29 10:58:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +35: [2023-04-29 10:58:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 10:58:45,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 3: [2023-04-29 10:58:45,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:45,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +42: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 10:58:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +21: [2023-04-29 10:58:45,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:45,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:45,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 10:58:45,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 10:58:45,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 10:58:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 10:58:45,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 10:58:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 10:58:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 10:58:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +43: [2023-04-29 10:58:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +43: [2023-04-29 10:58:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +43: [2023-04-29 10:58:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 10:58:45,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 10:58:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +55: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 10:58:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +35: [2023-04-29 10:58:45,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:45,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:45,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:45,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:45,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:45,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 10:58:45,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +10: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +10: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +10: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 10:58:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 10:58:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 10:58:45,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +39: [2023-04-29 10:58:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 10:58:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +27: [2023-04-29 10:58:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +27: [2023-04-29 10:58:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +27: [2023-04-29 10:58:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 10:58:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +32: [2023-04-29 10:58:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +27: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +39: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 10:58:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:45,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 10:58:45,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 10:58:45,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +32: [2023-04-29 10:58:45,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 10:58:45,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +33: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +33: [2023-04-29 10:58:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 10:58:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 10:58:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 10:58:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 10:58:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +22: [2023-04-29 10:58:45,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 10:58:45,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:45,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 10:58:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 10:58:45,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 3: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 10:58:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +15: [2023-04-29 10:58:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +55: [2023-04-29 10:58:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 10:58:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +22: [2023-04-29 10:58:45,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 10:58:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 10:58:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 10:58:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 10:58:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +40: [2023-04-29 10:58:45,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 10:58:45,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 10:58:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 10:58:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +17: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +45: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +45: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +10: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +45: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +10: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +17: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:45,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 8: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:45,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +27: [2023-04-29 10:58:45,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 10:58:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 10:58:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 10:58:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 10:58:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 10:58:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 10:58:45,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +27: [2023-04-29 10:58:45,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 10:58:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 10:58:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:45,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:45,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:45,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:45,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +29: [2023-04-29 10:58:45,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +59: [2023-04-29 10:58:45,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:45,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +29: [2023-04-29 10:58:45,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +62: [2023-04-29 10:58:45,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 10:58:45,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:45,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:45,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +57: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 10:58:45,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +17: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +17: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:45,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:45,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:45,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +45: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 10:58:45,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 10:58:45,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 10:58:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 10:58:45,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 10:58:45,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:45,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:45,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +37: [2023-04-29 10:58:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +37: [2023-04-29 10:58:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 10:58:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 10:58:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 10:58:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +37: [2023-04-29 10:58:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 10:58:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 10:58:45,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 10:58:45,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +57: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +19: [2023-04-29 10:58:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 10:58:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:45,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:45,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 5: [2023-04-29 10:58:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +50: [2023-04-29 10:58:45,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:45,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:45,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +50: [2023-04-29 10:58:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 10:58:45,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 10:58:45,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:45,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:45,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 10:58:45,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:45,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 10:58:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 10:58:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 10:58:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 10:58:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 6: [2023-04-29 10:58:45,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 10:58:45,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 10:58:45,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 10:58:45,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +61: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +61: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +61: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:45,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 10:58:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 10:58:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:45,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:45,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 10:58:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +49: [2023-04-29 10:58:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:45,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 10:58:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 10:58:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 10:58:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 10:58:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +52: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +52: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +52: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +19: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 10:58:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +38: [2023-04-29 10:58:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 10:58:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:45,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +32: [2023-04-29 10:58:45,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 10:58:45,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +32: [2023-04-29 10:58:45,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 10:58:45,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 10:58:45,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 10:58:45,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:45,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:45,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 10:58:45,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 10:58:45,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:45,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 10:58:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 10:58:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 10:58:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 10:58:45,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +45: [2023-04-29 10:58:45,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +45: [2023-04-29 10:58:45,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +34: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 10:58:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:45,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +34: [2023-04-29 10:58:45,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +18: [2023-04-29 10:58:45,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 10:58:45,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 10:58:45,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +51: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 10:58:45,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 10:58:45,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:45,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 10:58:45,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 10:58:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 10:58:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 10:58:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 10:58:45,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:45,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +18: [2023-04-29 10:58:45,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 10:58:45,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 10:58:45,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:45,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:45,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +48: [2023-04-29 10:58:45,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 10:58:45,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 9: [2023-04-29 10:58:45,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 10:58:45,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +48: [2023-04-29 10:58:45,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 10:58:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 10:58:45,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +44: [2023-04-29 10:58:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 10:58:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 10:58:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 10:58:45,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 10:58:45,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +23: [2023-04-29 10:58:45,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 10:58:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 10:58:45,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +21: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +21: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +34: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +21: [2023-04-29 10:58:45,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +34: [2023-04-29 10:58:45,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:45,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:45,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 10:58:45,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:45,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +42: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +51: [2023-04-29 10:58:45,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:45,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:45,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:45,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +19: [2023-04-29 10:58:45,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 10:58:45,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:45,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +56: [2023-04-29 10:58:45,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +56: [2023-04-29 10:58:45,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +56: [2023-04-29 10:58:45,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 10:58:45,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +42: [2023-04-29 10:58:45,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 10:58:45,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +31: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +48: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +25: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +49: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +42: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +42: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +47: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +60: [2023-04-29 10:58:45,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:45,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +20: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +31: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +31: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +58: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +49: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 10:58:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +58: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +28: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +44: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +37: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +60: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +60: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +11: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +11: [2023-04-29 10:58:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +11: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +49: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 10:58:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +30: [2023-04-29 10:58:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +30: [2023-04-29 10:58:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +38: [2023-04-29 10:58:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +28: [2023-04-29 10:58:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 10:58:45,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +28: [2023-04-29 10:58:45,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 10:58:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +21: [2023-04-29 10:58:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:45,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:45,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 10:58:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +19: [2023-04-29 10:58:45,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 10:58:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 10:58:45,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 10:58:45,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 10:58:45,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +29: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +29: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +55: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +11: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 7: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 10:58:45,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +55: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 10:58:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 10:58:45,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +38: [2023-04-29 10:58:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +30: [2023-04-29 10:58:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:45,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:45,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 10:58:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 10:58:45,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 10:58:45,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +38: [2023-04-29 10:58:45,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:45,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:45,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 10:58:45,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +38: [2023-04-29 10:58:45,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 10:58:45,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +34: [2023-04-29 10:58:45,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +28: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +28: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +28: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +38: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 10:58:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +34: [2023-04-29 10:58:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 10:58:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:45,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:45,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 10:58:45,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +17: [2023-04-29 10:58:45,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +34: [2023-04-29 10:58:45,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +17: [2023-04-29 10:58:45,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +17: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 8: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +17: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 8: [2023-04-29 10:58:45,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:45,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +42: [2023-04-29 10:58:45,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 10:58:45,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 10:58:45,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 10:58:45,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 10:58:45,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +42: [2023-04-29 10:58:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +24: [2023-04-29 10:58:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 10:58:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +55: [2023-04-29 10:58:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 10:58:45,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 10:58:45,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:45,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:45,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:45,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 10:58:45,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +21: [2023-04-29 10:58:45,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:45,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +41: [2023-04-29 10:58:45,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 10:58:45,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +28: [2023-04-29 10:58:45,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:45,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 10:58:45,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 10:58:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 10:58:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 10:58:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:45,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:45,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 10:58:45,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 10:58:45,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 10:58:45,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +21: [2023-04-29 10:58:45,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 10:58:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +21: [2023-04-29 10:58:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 10:58:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +28: [2023-04-29 10:58:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:45,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +21: [2023-04-29 10:58:45,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +35: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 4: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +35: [2023-04-29 10:58:45,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +21: [2023-04-29 10:58:45,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +28: [2023-04-29 10:58:45,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:45,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 10:58:45,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 10:58:45,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:45,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 10:58:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:45,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:45,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 10:58:45,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 10:58:45,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 10:58:45,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:45,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +29: [2023-04-29 10:58:45,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:45,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +25: [2023-04-29 10:58:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +56: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +20: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 10:58:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +41: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +43: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +43: [2023-04-29 10:58:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +31: [2023-04-29 10:58:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +25: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +55: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +29: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +54: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +54: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 10:58:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +54: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +54: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +54: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 2: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 2: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:45,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 10:58:45,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +25: [2023-04-29 10:58:45,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +25: [2023-04-29 10:58:45,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +31: [2023-04-29 10:58:45,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +35: [2023-04-29 10:58:45,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +62: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:45,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 10:58:45,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:45,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 10:58:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 10:58:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 10:58:45,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +28: [2023-04-29 10:58:45,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:45,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 10:58:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 10:58:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 10:58:45,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:45,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 10:58:45,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:45,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +33: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 2: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +53: [2023-04-29 10:58:45,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 10:58:45,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 10:58:45,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:45,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +32: [2023-04-29 10:58:45,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:45,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:45,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 10:58:45,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +51: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +32: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +17: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 10:58:45,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt. + 8: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 10:58:45,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +49: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:45,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 10:58:45,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 10:58:45,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:45,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:45,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:45,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:45,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:45,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +38: [2023-04-29 10:58:45,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:45,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 10:58:45,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 10:58:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 10:58:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:45,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 10:58:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 10:58:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +29: [2023-04-29 10:58:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:46,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 10:58:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:46,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:46,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 10:58:46,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:46,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 10:58:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 10:58:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:46,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +24: [2023-04-29 10:58:46,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +33: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +33: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +26: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +38: [2023-04-29 10:58:46,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:46,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +13: [2023-04-29 10:58:46,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 10:58:46,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 10:58:46,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 10:58:46,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +55: [2023-04-29 10:58:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +28: [2023-04-29 10:58:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +28: [2023-04-29 10:58:46,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 10:58:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:46,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:46,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 10:58:46,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 10:58:46,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 10:58:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +58: [2023-04-29 10:58:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +16: [2023-04-29 10:58:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:46,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +16: [2023-04-29 10:58:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 10:58:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 10:58:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +28: [2023-04-29 10:58:46,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:46,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +51: [2023-04-29 10:58:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 10:58:46,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:46,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:46,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:46,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 10:58:46,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 10:58:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 10:58:46,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 10:58:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +53: [2023-04-29 10:58:46,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 10:58:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +40: [2023-04-29 10:58:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 10:58:46,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +54: [2023-04-29 10:58:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 10:58:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +41: [2023-04-29 10:58:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 10:58:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 10:58:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +59: [2023-04-29 10:58:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +59: [2023-04-29 10:58:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +53: [2023-04-29 10:58:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +30: [2023-04-29 10:58:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +14: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt. +30: [2023-04-29 10:58:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +30: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 10:58:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +41: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +13: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 10:58:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 10:58:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 10:58:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 10:58:46,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +46: [2023-04-29 10:58:46,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +46: [2023-04-29 10:58:46,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +41: [2023-04-29 10:58:46,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +58: [2023-04-29 10:58:46,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:46,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +41: [2023-04-29 10:58:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +12: [2023-04-29 10:58:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 10:58:46,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 10:58:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:46,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 10:58:46,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 10:58:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 10:58:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 10:58:46,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 10:58:46,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:46,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +12: [2023-04-29 10:58:46,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 10:58:46,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:46,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +54: [2023-04-29 10:58:46,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +36: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +12: [2023-04-29 10:58:46,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 10:58:46,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +49: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +49: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. + 2: [2023-04-29 10:58:46,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +54: [2023-04-29 10:58:46,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:46,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 10:58:46,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:46,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 10:58:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 10:58:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 10:58:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:46,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 10:58:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +47: [2023-04-29 10:58:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 10:58:46,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +41: [2023-04-29 10:58:46,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +47: [2023-04-29 10:58:46,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +12: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +12: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +63: [2023-04-29 10:58:46,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +60: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +60: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +12: [2023-04-29 10:58:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +51: [2023-04-29 10:58:46,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 10:58:46,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 10:58:46,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:46,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +63: [2023-04-29 10:58:46,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 10:58:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 10:58:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 10:58:46,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 10:58:46,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 10:58:46,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 10:58:46,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 10:58:46,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +24: [2023-04-29 10:58:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +41: [2023-04-29 10:58:46,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 10:58:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 10:58:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 10:58:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 10:58:46,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:46,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 10:58:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +51: [2023-04-29 10:58:46,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 10:58:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 10:58:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 10:58:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 10:58:46,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 10:58:46,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +51: [2023-04-29 10:58:46,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... +30: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +41: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +51: [2023-04-29 10:58:46,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 10:58:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 10:58:46,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +32: [2023-04-29 10:58:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +30: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +32: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +32: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 10:58:46,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 10:58:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +34: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +14: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +46: [2023-04-29 10:58:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 10:58:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +34: [2023-04-29 10:58:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +14: [2023-04-29 10:58:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 10:58:46,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 10:58:46,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +36: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 10:58:46,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 10:58:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 10:58:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 10:58:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 10:58:46,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 10:58:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 10:58:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 10:58:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +46: [2023-04-29 10:58:46,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 10:58:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +49: [2023-04-29 10:58:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +12: [2023-04-29 10:58:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:46,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +50: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 10:58:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 10:58:46,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 10:58:46,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 10:58:46,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:46,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 10:58:46,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 10:58:46,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 10:58:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +49: [2023-04-29 10:58:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 10:58:46,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 10:58:46,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +10: [2023-04-29 10:58:46,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +49: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 3: [2023-04-29 10:58:46,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +33: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 10:58:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +49: [2023-04-29 10:58:46,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +32: [2023-04-29 10:58:46,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +37: [2023-04-29 10:58:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +57: [2023-04-29 10:58:46,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 10:58:46,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 10:58:46,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +57: [2023-04-29 10:58:46,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 10:58:46,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +57: [2023-04-29 10:58:46,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 10:58:46,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 10:58:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 10:58:46,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 10:58:46,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 10:58:46,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 10:58:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 10:58:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 10:58:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 10:58:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +22: [2023-04-29 10:58:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:46,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:46,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 10:58:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 10:58:46,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:46,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:46,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 10:58:46,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +20: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 10:58:46,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 10:58:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:46,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 10:58:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:46,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 10:58:46,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 10:58:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 10:58:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +35: [2023-04-29 10:58:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 10:58:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 10:58:46,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 10:58:46,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 10:58:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 10:58:46,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 10:58:46,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +10: [2023-04-29 10:58:46,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 10:58:46,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:46,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +56: [2023-04-29 10:58:46,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 10:58:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:46,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 10:58:46,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 10:58:46,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 10:58:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 10:58:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 10:58:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 10:58:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +21: [2023-04-29 10:58:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 10:58:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 10:58:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 10:58:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +57: [2023-04-29 10:58:46,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +45: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:46,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 10:58:46,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +21: [2023-04-29 10:58:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +21: [2023-04-29 10:58:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 10:58:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 10:58:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +23: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +48: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +48: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +48: [2023-04-29 10:58:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +56: [2023-04-29 10:58:46,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +53: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +53: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +53: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 10:58:46,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 10:58:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +61: [2023-04-29 10:58:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +48: [2023-04-29 10:58:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 10:58:46,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 10:58:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +61: [2023-04-29 10:58:46,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 10:58:46,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +53: [2023-04-29 10:58:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 10:58:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +35: [2023-04-29 10:58:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +53: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 10:58:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +11: [2023-04-29 10:58:46,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +35: [2023-04-29 10:58:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 10:58:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +59: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 10:58:46,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 10:58:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +40: [2023-04-29 10:58:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:46,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +22: [2023-04-29 10:58:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 10:58:46,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +53: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +11: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +20: [2023-04-29 10:58:46,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 10:58:46,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +11: [2023-04-29 10:58:46,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 10:58:46,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +57: [2023-04-29 10:58:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 10:58:46,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:46,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 10:58:46,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 10:58:46,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:46,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +23: [2023-04-29 10:58:46,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 10:58:46,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +20: [2023-04-29 10:58:46,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 10:58:46,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +23: [2023-04-29 10:58:46,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 10:58:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 10:58:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:46,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 10:58:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:46,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 10:58:46,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:46,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 10:58:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +60: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +27: [2023-04-29 10:58:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +15: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +60: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 10:58:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:46,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +15: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 10:58:46,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 10:58:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +41: [2023-04-29 10:58:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 10:58:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 10:58:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 10:58:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 10:58:46,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +57: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 10:58:46,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 10:58:46,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +22: [2023-04-29 10:58:46,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 10:58:46,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 10:58:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +22: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 10:58:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 10:58:46,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 10:58:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 10:58:46,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +23: [2023-04-29 10:58:46,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 10:58:46,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 10:58:46,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +16: [2023-04-29 10:58:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 10:58:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +16: [2023-04-29 10:58:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +47: [2023-04-29 10:58:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +47: [2023-04-29 10:58:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 10:58:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +51: [2023-04-29 10:58:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 10:58:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 10:58:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +47: [2023-04-29 10:58:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +16: [2023-04-29 10:58:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +61: [2023-04-29 10:58:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 10:58:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 10:58:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +47: [2023-04-29 10:58:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +47: [2023-04-29 10:58:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 10:58:46,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 10:58:46,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 10:58:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 10:58:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 3: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 3: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 3: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:46,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +11: [2023-04-29 10:58:46,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 10:58:46,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:46,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 10:58:46,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 10:58:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 10:58:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 10:58:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +48: [2023-04-29 10:58:46,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 10:58:46,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:46,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:46,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 10:58:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +61: [2023-04-29 10:58:46,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:46,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 10:58:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +60: [2023-04-29 10:58:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 10:58:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +39: [2023-04-29 10:58:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 10:58:46,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +60: [2023-04-29 10:58:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +21: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +39: [2023-04-29 10:58:46,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 10:58:46,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 10:58:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:46,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 10:58:46,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +62: [2023-04-29 10:58:46,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +23: [2023-04-29 10:58:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 10:58:46,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +13: [2023-04-29 10:58:46,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:46,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +39: [2023-04-29 10:58:46,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +53: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 10:58:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 10:58:46,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 10:58:46,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +23: [2023-04-29 10:58:46,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +39: [2023-04-29 10:58:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:46,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 10:58:46,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +13: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +53: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +15: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +53: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +21: [2023-04-29 10:58:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +15: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +13: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +13: [2023-04-29 10:58:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:46,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 10:58:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +60: [2023-04-29 10:58:46,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 10:58:46,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 10:58:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:46,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +19: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 10:58:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 10:58:46,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +39: [2023-04-29 10:58:46,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 10:58:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 10:58:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 5: [2023-04-29 10:58:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +60: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +26: [2023-04-29 10:58:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 10:58:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 10:58:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:46,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +16: [2023-04-29 10:58:46,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 10:58:46,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 10:58:46,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 10:58:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +53: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 10:58:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 10:58:46,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 10:58:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:46,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 10:58:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +21: [2023-04-29 10:58:46,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +47: [2023-04-29 10:58:46,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 10:58:46,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +17: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +17: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +17: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +42: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +42: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +42: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +42: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +55: [2023-04-29 10:58:46,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 10:58:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +47: [2023-04-29 10:58:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 10:58:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 10:58:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 10:58:46,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 10:58:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +31: [2023-04-29 10:58:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +31: [2023-04-29 10:58:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +31: [2023-04-29 10:58:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +45: [2023-04-29 10:58:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 10:58:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 10:58:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 10:58:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 10:58:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +23: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 10:58:46,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 10:58:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +23: [2023-04-29 10:58:46,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:46,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:46,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 10:58:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +15: [2023-04-29 10:58:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:46,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:46,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +17: [2023-04-29 10:58:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +47: [2023-04-29 10:58:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +17: [2023-04-29 10:58:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +42: [2023-04-29 10:58:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +17: [2023-04-29 10:58:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 10:58:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +31: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 10:58:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 10:58:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 10:58:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +13: [2023-04-29 10:58:46,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 10:58:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +59: [2023-04-29 10:58:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +26: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +44: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +44: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +26: [2023-04-29 10:58:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +15: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 10:58:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 10:58:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 10:58:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +29: [2023-04-29 10:58:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 10:58:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 10:58:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 10:58:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 10:58:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 10:58:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 10:58:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 10:58:46,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +15: [2023-04-29 10:58:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 10:58:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 10:58:46,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 10:58:46,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:46,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 10:58:46,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +19: [2023-04-29 10:58:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +55: [2023-04-29 10:58:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +19: [2023-04-29 10:58:46,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +55: [2023-04-29 10:58:46,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +19: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 10:58:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 10:58:46,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +25: [2023-04-29 10:58:46,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 10:58:46,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +51: [2023-04-29 10:58:46,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +28: [2023-04-29 10:58:46,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +62: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +62: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +62: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +25: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +62: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +31: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +31: [2023-04-29 10:58:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 10:58:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 10:58:46,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 10:58:46,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 10:58:46,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +20: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +45: [2023-04-29 10:58:46,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +45: [2023-04-29 10:58:46,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +55: [2023-04-29 10:58:46,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +29: [2023-04-29 10:58:46,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:46,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +25: [2023-04-29 10:58:46,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 10:58:46,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 10:58:46,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 10:58:46,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 10:58:46,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 10:58:46,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 10:58:46,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +25: [2023-04-29 10:58:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +40: [2023-04-29 10:58:46,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 10:58:46,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 10:58:46,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 10:58:46,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +10: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +10: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 10:58:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 10:58:46,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 10:58:46,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 10:58:46,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 10:58:46,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +40: [2023-04-29 10:58:46,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt... +29: [2023-04-29 10:58:46,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 10:58:46,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:46,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:46,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +59: [2023-04-29 10:58:46,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 10:58:46,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:46,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +18: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:46,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +10: [2023-04-29 10:58:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 10:58:46,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:46,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 10:58:46,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 10:58:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 10:58:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +36: [2023-04-29 10:58:46,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 10:58:46,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 10:58:46,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +24: [2023-04-29 10:58:46,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 10:58:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 10:58:46,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:46,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 10:58:46,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 10:58:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +24: [2023-04-29 10:58:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 10:58:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 10:58:46,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +31: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 10:58:46,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +62: [2023-04-29 10:58:46,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:46,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +32: [2023-04-29 10:58:46,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 10:58:46,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +32: [2023-04-29 10:58:46,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +32: [2023-04-29 10:58:46,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 10:58:46,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 10:58:46,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +31: [2023-04-29 10:58:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 10:58:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +51: [2023-04-29 10:58:46,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 10:58:46,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 10:58:46,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +28: [2023-04-29 10:58:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 10:58:46,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 10:58:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 10:58:46,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +11: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +11: [2023-04-29 10:58:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +55: [2023-04-29 10:58:46,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:46,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +42: [2023-04-29 10:58:46,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +42: [2023-04-29 10:58:46,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +40: [2023-04-29 10:58:46,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 10:58:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +25: [2023-04-29 10:58:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +42: [2023-04-29 10:58:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 10:58:46,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +58: [2023-04-29 10:58:46,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 10:58:46,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +58: [2023-04-29 10:58:46,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +24: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +14: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +14: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +46: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +24: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +24: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +31: [2023-04-29 10:58:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +55: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +40: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 10:58:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 10:58:46,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +44: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:46,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +35: [2023-04-29 10:58:46,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +35: [2023-04-29 10:58:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 10:58:46,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 10:58:46,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 10:58:46,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:46,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +32: [2023-04-29 10:58:46,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 10:58:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +44: [2023-04-29 10:58:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +44: [2023-04-29 10:58:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:46,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:46,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 0: [2023-04-29 10:58:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 0: [2023-04-29 10:58:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +44: [2023-04-29 10:58:46,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +44: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +45: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:46,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +44: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 10:58:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +55: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +31: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:46,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +10: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:46,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 10:58:46,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 10:58:46,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 10:58:46,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 10:58:46,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 10:58:46,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:46,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 10:58:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 10:58:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 10:58:46,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 10:58:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 10:58:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:46,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:46,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:46,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:46,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:46,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 10:58:46,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 10:58:46,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 10:58:46,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +14: [2023-04-29 10:58:46,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 10:58:46,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 10:58:46,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 10:58:46,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 10:58:46,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 10:58:46,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +14: [2023-04-29 10:58:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 10:58:46,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +29: [2023-04-29 10:58:46,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 10:58:46,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:46,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 10:58:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 2: [2023-04-29 10:58:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +35: [2023-04-29 10:58:46,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 5: [2023-04-29 10:58:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +10: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +10: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +18: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 2: [2023-04-29 10:58:46,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 10:58:46,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 5: [2023-04-29 10:58:46,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 10:58:46,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +38: [2023-04-29 10:58:46,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:46,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +29: [2023-04-29 10:58:46,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 10:58:46,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 10:58:46,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +49: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 10:58:46,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +49: [2023-04-29 10:58:46,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 10:58:46,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 10:58:46,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +33: [2023-04-29 10:58:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +33: [2023-04-29 10:58:46,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +33: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +29: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +50: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +33: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +50: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +50: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +50: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +23: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:46,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 10:58:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 10:58:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 10:58:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +10: [2023-04-29 10:58:46,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 10:58:46,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:46,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 10:58:46,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:46,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +58: [2023-04-29 10:58:46,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 10:58:46,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +12: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +42: [2023-04-29 10:58:46,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +36: [2023-04-29 10:58:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +17: [2023-04-29 10:58:46,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 10:58:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +24: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +36: [2023-04-29 10:58:46,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 5: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 10:58:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +24: [2023-04-29 10:58:46,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 10:58:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 10:58:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 10:58:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +24: [2023-04-29 10:58:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 10:58:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 10:58:46,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +49: [2023-04-29 10:58:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 10:58:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 10:58:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 10:58:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +63: [2023-04-29 10:58:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +15: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +24: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +61: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +61: [2023-04-29 10:58:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +50: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +15: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 10:58:46,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +61: [2023-04-29 10:58:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 10:58:46,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +15: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 10:58:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 10:58:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 10:58:46,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 3: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +45: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:46,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 10:58:46,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +41: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +22: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +22: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +45: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:46,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:46,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:46,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 10:58:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 10:58:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 10:58:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 10:58:46,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +44: [2023-04-29 10:58:46,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +13: [2023-04-29 10:58:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 10:58:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +42: [2023-04-29 10:58:46,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 10:58:46,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:46,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +42: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 10:58:46,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +27: [2023-04-29 10:58:46,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 10:58:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 10:58:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 10:58:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 10:58:46,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:46,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 10:58:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 10:58:46,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 10:58:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:46,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 10:58:46,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:46,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:46,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:46,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 10:58:46,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:46,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 10:58:46,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:46,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:46,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 10:58:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 10:58:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +19: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +16: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +21: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +21: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +21: [2023-04-29 10:58:46,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +52: [2023-04-29 10:58:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 10:58:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 10:58:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 10:58:46,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +19: [2023-04-29 10:58:46,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +19: [2023-04-29 10:58:46,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 10:58:46,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 10:58:46,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 10:58:46,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 10:58:46,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:46,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 10:58:46,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +10: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 8: [2023-04-29 10:58:46,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 10:58:46,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +10: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 8: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 8: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 10:58:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +36: [2023-04-29 10:58:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 10:58:46,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 10:58:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +54: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 10:58:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 10:58:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 10:58:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 10:58:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +28: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 10:58:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 10:58:46,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 10:58:46,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 10:58:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 10:58:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 10:58:46,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 10:58:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:46,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 10:58:46,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 10:58:46,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:46,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:46,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +37: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +12: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 10:58:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:46,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +12: [2023-04-29 10:58:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 10:58:46,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +46: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 2: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +12: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +46: [2023-04-29 10:58:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 10:58:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 10:58:46,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 10:58:46,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 10:58:46,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +41: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +49: [2023-04-29 10:58:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 10:58:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 10:58:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 10:58:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 10:58:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 10:58:46,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 10:58:46,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +31: [2023-04-29 10:58:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 10:58:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 10:58:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 10:58:46,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 10:58:46,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 10:58:46,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 10:58:46,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 10:58:46,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +47: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +47: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 1: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 10:58:46,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 10:58:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 10:58:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 10:58:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 10:58:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 10:58:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 10:58:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 10:58:46,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +12: [2023-04-29 10:58:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 10:58:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 10:58:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 10:58:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 10:58:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 10:58:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 10:58:46,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 9: [2023-04-29 10:58:46,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 10:58:46,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 10:58:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 10:58:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 10:58:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +60: [2023-04-29 10:58:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 10:58:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 10:58:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +47: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 10:58:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:46,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:46,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 8: [2023-04-29 10:58:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +53: [2023-04-29 10:58:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +30: [2023-04-29 10:58:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 10:58:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 10:58:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 10:58:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +56: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 10:58:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 10:58:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 10:58:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +56: [2023-04-29 10:58:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:46,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +56: [2023-04-29 10:58:46,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +30: [2023-04-29 10:58:46,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 10:58:46,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 10:58:46,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 10:58:46,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 8: [2023-04-29 10:58:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:46,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:46,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +18: [2023-04-29 10:58:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +18: [2023-04-29 10:58:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +18: [2023-04-29 10:58:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +18: [2023-04-29 10:58:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:46,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:46,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 10:58:46,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +51: [2023-04-29 10:58:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +25: [2023-04-29 10:58:46,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +25: [2023-04-29 10:58:46,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +25: [2023-04-29 10:58:46,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +25: [2023-04-29 10:58:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +51: [2023-04-29 10:58:46,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 10:58:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +20: [2023-04-29 10:58:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +20: [2023-04-29 10:58:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +20: [2023-04-29 10:58:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +46: [2023-04-29 10:58:46,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 10:58:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +18: [2023-04-29 10:58:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 10:58:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 10:58:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +29: [2023-04-29 10:58:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 10:58:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 10:58:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 10:58:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +49: [2023-04-29 10:58:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +25: [2023-04-29 10:58:46,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 7: [2023-04-29 10:58:46,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:46,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 7: [2023-04-29 10:58:46,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 10:58:46,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 7: [2023-04-29 10:58:46,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 10:58:46,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 10:58:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 10:58:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 10:58:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +25: [2023-04-29 10:58:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +27: [2023-04-29 10:58:46,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +14: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:46,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 10:58:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 10:58:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 10:58:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 4: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 10:58:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +14: [2023-04-29 10:58:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 10:58:46,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 10:58:46,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +14: [2023-04-29 10:58:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +14: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +16: [2023-04-29 10:58:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 10:58:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 10:58:46,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +16: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 10:58:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +16: [2023-04-29 10:58:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 10:58:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 10:58:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 10:58:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 10:58:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 10:58:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 10:58:46,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:46,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:46,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 10:58:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +39: [2023-04-29 10:58:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +39: [2023-04-29 10:58:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +39: [2023-04-29 10:58:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +39: [2023-04-29 10:58:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:46,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +27: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 10:58:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +52: [2023-04-29 10:58:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +52: [2023-04-29 10:58:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 10:58:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +52: [2023-04-29 10:58:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 10:58:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +52: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +49: [2023-04-29 10:58:46,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:46,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:46,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 10:58:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +32: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +32: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 10:58:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 10:58:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +57: [2023-04-29 10:58:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +57: [2023-04-29 10:58:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +57: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:46,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 10:58:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 10:58:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 10:58:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 10:58:46,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:46,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:46,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:46,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:46,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:46,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 10:58:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 10:58:46,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 10:58:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +33: [2023-04-29 10:58:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +33: [2023-04-29 10:58:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:46,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 10:58:46,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +56: [2023-04-29 10:58:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 10:58:46,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +33: [2023-04-29 10:58:46,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 10:58:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 10:58:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 10:58:46,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 10:58:46,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:46,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 10:58:46,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 10:58:46,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 10:58:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 10:58:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 10:58:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +13: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 10:58:46,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 10:58:46,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 10:58:46,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 10:58:46,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 10:58:46,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 10:58:46,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +62: [2023-04-29 10:58:46,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:46,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:46,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 10:58:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 10:58:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 10:58:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 10:58:46,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 10:58:46,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:46,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:46,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:47,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +14: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 10:58:47,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:47,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:47,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +10: [2023-04-29 10:58:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 10:58:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 10:58:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +14: [2023-04-29 10:58:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 10:58:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +32: [2023-04-29 10:58:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 10:58:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:47,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +43: [2023-04-29 10:58:47,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +43: [2023-04-29 10:58:47,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +17: [2023-04-29 10:58:47,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:47,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +38: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +59: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +59: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +13: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +59: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +59: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +38: [2023-04-29 10:58:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +17: [2023-04-29 10:58:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:47,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:47,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 10:58:47,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 10:58:47,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 10:58:47,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +26: [2023-04-29 10:58:47,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +57: [2023-04-29 10:58:47,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:47,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +62: [2023-04-29 10:58:47,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:47,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 10:58:47,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +26: [2023-04-29 10:58:47,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:47,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:47,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:47,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +10: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:47,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +41: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +10: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 10:58:47,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 10:58:47,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 10:58:47,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:47,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 10:58:47,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:47,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 10:58:47,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +11: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +11: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +49: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:47,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +11: [2023-04-29 10:58:47,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +61: [2023-04-29 10:58:47,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +11: [2023-04-29 10:58:47,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +42: [2023-04-29 10:58:47,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 10:58:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 10:58:47,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 10:58:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 10:58:47,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +54: [2023-04-29 10:58:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +49: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:47,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 10:58:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:47,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:47,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 9: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +63: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 9: [2023-04-29 10:58:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 10:58:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 10:58:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 10:58:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +63: [2023-04-29 10:58:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +24: [2023-04-29 10:58:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 10:58:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:47,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 10:58:47,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 10:58:47,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 10:58:47,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:47,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +35: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 10:58:47,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 10:58:47,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +58: [2023-04-29 10:58:47,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 10:58:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 10:58:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +42: [2023-04-29 10:58:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +11: [2023-04-29 10:58:47,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +55: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +11: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +11: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +48: [2023-04-29 10:58:47,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 10:58:47,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 10:58:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 10:58:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +11: [2023-04-29 10:58:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 10:58:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +54: [2023-04-29 10:58:47,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 10:58:47,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 10:58:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 10:58:47,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +28: [2023-04-29 10:58:47,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 10:58:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 10:58:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 10:58:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +56: [2023-04-29 10:58:47,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:47,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 10:58:47,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 10:58:47,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 10:58:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 10:58:47,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 10:58:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 10:58:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 10:58:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. + 8: [2023-04-29 10:58:47,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 10:58:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:47,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 10:58:47,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +44: [2023-04-29 10:58:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 10:58:47,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 10:58:47,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 10:58:47,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt. +42: [2023-04-29 10:58:47,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +42: [2023-04-29 10:58:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 10:58:47,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 10:58:47,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 2: [2023-04-29 10:58:47,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 10:58:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 10:58:47,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +44: [2023-04-29 10:58:47,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +44: [2023-04-29 10:58:47,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +44: [2023-04-29 10:58:47,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 10:58:47,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 10:58:47,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 10:58:47,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 10:58:47,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:47,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +28: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 10:58:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 10:58:47,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 10:58:47,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:47,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 10:58:47,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:47,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 10:58:47,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 10:58:47,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 10:58:47,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 10:58:47,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 10:58:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 10:58:47,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +12: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +12: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +40: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +39: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +12: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +39: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 10:58:47,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:47,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 10:58:47,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:47,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:47,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:47,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +26: [2023-04-29 10:58:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 10:58:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 10:58:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:47,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 10:58:47,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +39: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +35: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +35: [2023-04-29 10:58:47,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 10:58:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:47,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 10:58:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 10:58:47,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 10:58:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 10:58:47,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +26: [2023-04-29 10:58:47,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 10:58:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +44: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 10:58:47,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 10:58:47,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:47,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 10:58:47,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:47,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 10:58:47,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +59: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +63: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +46: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +59: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +59: [2023-04-29 10:58:47,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 10:58:47,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 10:58:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 10:58:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +46: [2023-04-29 10:58:47,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 10:58:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 10:58:47,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +12: [2023-04-29 10:58:47,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:47,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 10:58:47,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:47,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 10:58:47,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 10:58:47,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 10:58:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +42: [2023-04-29 10:58:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 10:58:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 10:58:47,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 10:58:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 10:58:47,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +27: [2023-04-29 10:58:47,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +27: [2023-04-29 10:58:47,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +27: [2023-04-29 10:58:47,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +30: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +13: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +13: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 10:58:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +46: [2023-04-29 10:58:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 10:58:47,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 10:58:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:47,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +37: [2023-04-29 10:58:47,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 10:58:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 10:58:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +47: [2023-04-29 10:58:47,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 10:58:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:47,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 10:58:47,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 10:58:47,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +13: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +54: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +13: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 4: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 4: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 10:58:47,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 10:58:47,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 10:58:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 10:58:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 10:58:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 10:58:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:47,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:47,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 10:58:47,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +39: [2023-04-29 10:58:47,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 10:58:47,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +39: [2023-04-29 10:58:47,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 10:58:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 10:58:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 10:58:47,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +52: [2023-04-29 10:58:47,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +52: [2023-04-29 10:58:47,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +52: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 10:58:47,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +60: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +60: [2023-04-29 10:58:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 10:58:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 10:58:47,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 10:58:47,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +58: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +16: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +40: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 10:58:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 10:58:47,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 10:58:47,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +14: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +36: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +14: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +40: [2023-04-29 10:58:47,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +14: [2023-04-29 10:58:47,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +40: [2023-04-29 10:58:47,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 10:58:47,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +40: [2023-04-29 10:58:47,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 10:58:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +52: [2023-04-29 10:58:47,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:47,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:47,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 10:58:47,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:47,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:47,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:47,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 10:58:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 10:58:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 10:58:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 10:58:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 10:58:47,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:47,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 10:58:47,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:47,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 10:58:47,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:47,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +22: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 10:58:47,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 10:58:47,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:47,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:47,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 10:58:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 10:58:47,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +22: [2023-04-29 10:58:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +22: [2023-04-29 10:58:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +22: [2023-04-29 10:58:47,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +46: [2023-04-29 10:58:47,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 10:58:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:47,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 10:58:47,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +37: [2023-04-29 10:58:47,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 10:58:47,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +37: [2023-04-29 10:58:47,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 10:58:47,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 10:58:47,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 10:58:47,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 10:58:47,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 10:58:47,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 10:58:47,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 10:58:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 10:58:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 10:58:47,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +58: [2023-04-29 10:58:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:47,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 10:58:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 10:58:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 10:58:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 10:58:47,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 10:58:47,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 10:58:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 10:58:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +32: [2023-04-29 10:58:47,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 10:58:47,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +45: [2023-04-29 10:58:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +24: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +24: [2023-04-29 10:58:47,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 10:58:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 10:58:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 10:58:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 10:58:47,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 10:58:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +24: [2023-04-29 10:58:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +24: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +24: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +55: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 10:58:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 10:58:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +52: [2023-04-29 10:58:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 10:58:47,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +22: [2023-04-29 10:58:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 10:58:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 1: [2023-04-29 10:58:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 1: [2023-04-29 10:58:47,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +44: [2023-04-29 10:58:47,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 1: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +44: [2023-04-29 10:58:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 10:58:47,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 10:58:47,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 10:58:47,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 10:58:47,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +55: [2023-04-29 10:58:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 10:58:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 10:58:47,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +26: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +26: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 10:58:47,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt. +32: [2023-04-29 10:58:47,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 10:58:47,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 10:58:47,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +33: [2023-04-29 10:58:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +10: [2023-04-29 10:58:47,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +10: [2023-04-29 10:58:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +33: [2023-04-29 10:58:47,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 10:58:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 10:58:47,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 10:58:47,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:47,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 10:58:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 10:58:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 10:58:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 10:58:47,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 10:58:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 10:58:47,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 10:58:47,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 10:58:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 10:58:47,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 10:58:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 10:58:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 10:58:47,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 10:58:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 10:58:47,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:47,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 10:58:47,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:47,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:47,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +62: [2023-04-29 10:58:47,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:47,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 10:58:47,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 10:58:47,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 10:58:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 10:58:47,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 10:58:47,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +41: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +41: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +21: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 10:58:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:47,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:47,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 10:58:47,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 10:58:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 10:58:47,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +49: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +49: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 10:58:47,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 10:58:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 10:58:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 10:58:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:47,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 10:58:47,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +31: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:47,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +42: [2023-04-29 10:58:47,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:47,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +31: [2023-04-29 10:58:47,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +31: [2023-04-29 10:58:47,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:47,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 10:58:47,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +41: [2023-04-29 10:58:47,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 10:58:47,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 10:58:47,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:47,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 10:58:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +23: [2023-04-29 10:58:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +23: [2023-04-29 10:58:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +33: [2023-04-29 10:58:47,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 10:58:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 10:58:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 10:58:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 10:58:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 10:58:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +49: [2023-04-29 10:58:47,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 10:58:47,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 10:58:47,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 10:58:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 10:58:47,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 10:58:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 10:58:47,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +19: [2023-04-29 10:58:47,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +33: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:47,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 10:58:47,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +56: [2023-04-29 10:58:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 10:58:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +56: [2023-04-29 10:58:47,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 10:58:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 10:58:47,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 10:58:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +19: [2023-04-29 10:58:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +63: [2023-04-29 10:58:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 10:58:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +19: [2023-04-29 10:58:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +19: [2023-04-29 10:58:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 10:58:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +19: [2023-04-29 10:58:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 10:58:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +15: [2023-04-29 10:58:47,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 10:58:47,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:47,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +50: [2023-04-29 10:58:47,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 10:58:47,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 10:58:47,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 10:58:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 10:58:47,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:47,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +32: [2023-04-29 10:58:47,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 10:58:47,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +18: [2023-04-29 10:58:47,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 10:58:47,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 10:58:47,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:47,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +33: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +56: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:47,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:47,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +56: [2023-04-29 10:58:47,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 10:58:47,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +32: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +48: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 10:58:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 10:58:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 10:58:47,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 10:58:47,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:47,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 10:58:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 10:58:47,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:47,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +53: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +53: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +31: [2023-04-29 10:58:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 10:58:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 10:58:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:47,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:47,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:47,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 10:58:47,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 10:58:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:47,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:47,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 10:58:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +62: [2023-04-29 10:58:47,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:47,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 10:58:47,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 10:58:47,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:47,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:47,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +31: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +31: [2023-04-29 10:58:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 10:58:47,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 10:58:47,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 10:58:47,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:47,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 10:58:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 10:58:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +41: [2023-04-29 10:58:47,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 10:58:47,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 10:58:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 10:58:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 10:58:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 10:58:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +43: [2023-04-29 10:58:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +31: [2023-04-29 10:58:47,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +53: [2023-04-29 10:58:47,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 10:58:47,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +63: [2023-04-29 10:58:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +42: [2023-04-29 10:58:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +42: [2023-04-29 10:58:47,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 10:58:47,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 10:58:47,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 10:58:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:47,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +49: [2023-04-29 10:58:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 10:58:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +18: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 10:58:47,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 10:58:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +49: [2023-04-29 10:58:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +23: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +53: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:47,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 10:58:47,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 10:58:47,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 10:58:47,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 10:58:47,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:47,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +29: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +29: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:47,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +28: [2023-04-29 10:58:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 10:58:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +28: [2023-04-29 10:58:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 10:58:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +31: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +48: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +58: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +37: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +37: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +43: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 10:58:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 10:58:47,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 10:58:47,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 10:58:47,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +47: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 7: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 7: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +38: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 10:58:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 7: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +34: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 7: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +39: [2023-04-29 10:58:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +17: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +54: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +54: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +17: [2023-04-29 10:58:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +51: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +47: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +47: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 6: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 10:58:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +20: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +20: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +19: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 10:58:47,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +18: [2023-04-29 10:58:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 10:58:47,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 10:58:47,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 10:58:47,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 10:58:47,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 10:58:47,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +18: [2023-04-29 10:58:47,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +41: [2023-04-29 10:58:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +50: [2023-04-29 10:58:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +50: [2023-04-29 10:58:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 10:58:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 10:58:47,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 10:58:47,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +41: [2023-04-29 10:58:47,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 10:58:47,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 10:58:47,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 10:58:47,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 10:58:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 10:58:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +56: [2023-04-29 10:58:47,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 10:58:47,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +56: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +41: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 10:58:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +34: [2023-04-29 10:58:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +59: [2023-04-29 10:58:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 10:58:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 10:58:47,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 10:58:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 10:58:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 10:58:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 10:58:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 10:58:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +39: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 10:58:47,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +40: [2023-04-29 10:58:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 10:58:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 10:58:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 2: [2023-04-29 10:58:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 10:58:47,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 0: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 10:58:47,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:47,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 10:58:47,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +36: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:47,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 10:58:47,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 10:58:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +53: [2023-04-29 10:58:47,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 10:58:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 10:58:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 10:58:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 0: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +60: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +25: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. + 0: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 0: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 10:58:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +53: [2023-04-29 10:58:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +38: [2023-04-29 10:58:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 10:58:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +51: [2023-04-29 10:58:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 10:58:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 10:58:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 10:58:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +38: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +59: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 10:58:47,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:47,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 10:58:47,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +25: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +46: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 10:58:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +29: [2023-04-29 10:58:47,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 10:58:47,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +33: [2023-04-29 10:58:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 10:58:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 7: [2023-04-29 10:58:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 10:58:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +38: [2023-04-29 10:58:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 10:58:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +53: [2023-04-29 10:58:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 10:58:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 10:58:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +29: [2023-04-29 10:58:47,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +33: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +54: [2023-04-29 10:58:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 10:58:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +38: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 10:58:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 9: [2023-04-29 10:58:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 10:58:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 10:58:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 10:58:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:47,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:47,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +25: [2023-04-29 10:58:47,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 10:58:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 10:58:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 10:58:47,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 10:58:47,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 10:58:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 10:58:47,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +29: [2023-04-29 10:58:47,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +53: [2023-04-29 10:58:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 10:58:47,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 10:58:47,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 10:58:47,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 10:58:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:47,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 10:58:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 7: [2023-04-29 10:58:47,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:47,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 10:58:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 10:58:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 10:58:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 10:58:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 10:58:47,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:47,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 10:58:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 10:58:47,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +28: [2023-04-29 10:58:47,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 10:58:47,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 10:58:47,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 6: [2023-04-29 10:58:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 10:58:47,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 10:58:47,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +28: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 10:58:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 10:58:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 10:58:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 10:58:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 10:58:47,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:47,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 10:58:47,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 10:58:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +34: [2023-04-29 10:58:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 10:58:47,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 4: [2023-04-29 10:58:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 2: [2023-04-29 10:58:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 10:58:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 4: [2023-04-29 10:58:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +46: [2023-04-29 10:58:47,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 10:58:47,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 10:58:47,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 10:58:47,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 10:58:47,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +51: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +53: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 10:58:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 10:58:47,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 10:58:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +51: [2023-04-29 10:58:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 2: [2023-04-29 10:58:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 10:58:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +11: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 10:58:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 0: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +46: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 10:58:47,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +11: [2023-04-29 10:58:47,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +46: [2023-04-29 10:58:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +15: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +15: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +47: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +15: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 10:58:47,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +40: [2023-04-29 10:58:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 10:58:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +27: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +27: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +51: [2023-04-29 10:58:47,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 10:58:47,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 10:58:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 10:58:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 10:58:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 10:58:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +12: [2023-04-29 10:58:47,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +12: [2023-04-29 10:58:47,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +12: [2023-04-29 10:58:47,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:47,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +46: [2023-04-29 10:58:47,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:47,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 10:58:47,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 10:58:47,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +32: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +59: [2023-04-29 10:58:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 10:58:47,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 10:58:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:47,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 10:58:47,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:47,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 10:58:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +15: [2023-04-29 10:58:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:47,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 10:58:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +52: [2023-04-29 10:58:47,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 10:58:47,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 10:58:47,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 10:58:47,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 10:58:47,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 10:58:47,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 10:58:47,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 10:58:47,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 10:58:47,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 10:58:47,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt. +60: [2023-04-29 10:58:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 10:58:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 10:58:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 10:58:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 10:58:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 10:58:47,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 10:58:47,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 10:58:47,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 10:58:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 10:58:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 10:58:47,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 10:58:47,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 10:58:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 10:58:47,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 10:58:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 10:58:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 10:58:47,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +12: [2023-04-29 10:58:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +33: [2023-04-29 10:58:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 10:58:47,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:47,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:47,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:47,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 10:58:47,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 10:58:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 10:58:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:47,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +35: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:47,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +26: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +26: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 10:58:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 10:58:47,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 10:58:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 10:58:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +26: [2023-04-29 10:58:47,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 10:58:47,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 10:58:47,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +60: [2023-04-29 10:58:47,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:47,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 10:58:47,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 10:58:47,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:47,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:47,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:47,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:47,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +56: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 10:58:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 10:58:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 10:58:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +57: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 10:58:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:47,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +63: [2023-04-29 10:58:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... + 1: [2023-04-29 10:58:47,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:47,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 10:58:47,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 10:58:47,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:47,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 10:58:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:47,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 10:58:47,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +56: [2023-04-29 10:58:47,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:47,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 10:58:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 10:58:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 10:58:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +39: [2023-04-29 10:58:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 10:58:47,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 10:58:47,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 10:58:47,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 10:58:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 10:58:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:47,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:47,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +34: [2023-04-29 10:58:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 10:58:47,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 10:58:47,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 10:58:47,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:47,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 10:58:47,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +61: [2023-04-29 10:58:47,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:47,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:47,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. +15: [2023-04-29 10:58:47,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +34: [2023-04-29 10:58:47,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 10:58:47,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 10:58:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +15: [2023-04-29 10:58:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +15: [2023-04-29 10:58:47,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +48: [2023-04-29 10:58:47,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 10:58:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +33: [2023-04-29 10:58:47,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +26: [2023-04-29 10:58:47,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 10:58:47,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:47,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 10:58:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 10:58:47,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:47,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 10:58:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 10:58:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 10:58:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 10:58:47,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 10:58:47,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 10:58:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:47,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +50: [2023-04-29 10:58:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +61: [2023-04-29 10:58:47,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:47,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 10:58:47,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +30: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:47,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +50: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 10:58:47,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +24: [2023-04-29 10:58:47,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +24: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 10:58:47,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 10:58:47,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 10:58:47,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 10:58:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 10:58:47,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 10:58:47,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 10:58:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 10:58:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:47,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 10:58:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +63: [2023-04-29 10:58:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 10:58:47,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +59: [2023-04-29 10:58:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:47,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +59: [2023-04-29 10:58:47,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +30: [2023-04-29 10:58:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 10:58:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 10:58:47,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 10:58:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:47,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 10:58:47,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +53: [2023-04-29 10:58:47,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:47,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +59: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 10:58:47,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 10:58:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:47,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +47: [2023-04-29 10:58:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 10:58:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 10:58:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 10:58:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 10:58:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +34: [2023-04-29 10:58:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:47,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 10:58:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +30: [2023-04-29 10:58:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 10:58:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:47,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 10:58:47,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 10:58:47,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +63: [2023-04-29 10:58:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:47,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:47,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:47,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +30: [2023-04-29 10:58:47,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:47,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 10:58:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 10:58:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +39: [2023-04-29 10:58:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:47,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 10:58:47,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:47,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 10:58:47,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 10:58:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:47,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +55: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 10:58:47,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:47,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 10:58:47,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:47,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 10:58:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:47,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 10:58:47,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 10:58:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +43: [2023-04-29 10:58:47,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:47,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:47,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:47,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:47,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 10:58:47,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 10:58:47,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 10:58:47,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +59: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +48: [2023-04-29 10:58:47,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 10:58:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:47,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:47,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:47,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:47,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +50: [2023-04-29 10:58:47,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:47,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 10:58:47,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 10:58:47,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 10:58:47,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 10:58:47,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 10:58:47,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 10:58:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:47,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:47,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 10:58:47,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:47,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 10:58:47,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:47,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:47,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 10:58:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 10:58:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +20: [2023-04-29 10:58:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 10:58:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 10:58:47,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +59: [2023-04-29 10:58:47,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:47,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:47,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 10:58:47,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 10:58:47,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:47,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:47,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 10:58:47,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 10:58:47,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 10:58:47,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 10:58:47,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 10:58:47,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 10:58:47,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +59: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:47,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 10:58:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +38: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:47,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:47,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:47,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:47,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +40: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:47,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +23: [2023-04-29 10:58:47,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:47,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +19: [2023-04-29 10:58:47,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 10:58:47,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 10:58:47,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +47: [2023-04-29 10:58:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +13: [2023-04-29 10:58:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 10:58:47,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +51: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 10:58:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 10:58:47,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:47,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:47,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:47,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:47,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:47,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:47,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:47,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:47,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:47,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 10:58:47,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:47,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:47,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 10:58:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:47,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:47,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:47,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:47,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 10:58:47,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 10:58:47,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:47,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 10:58:47,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:47,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:47,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:47,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 10:58:47,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 10:58:47,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +45: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 10:58:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:47,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:47,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:48,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 10:58:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:48,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 10:58:48,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +38: [2023-04-29 10:58:48,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 10:58:48,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 10:58:48,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 10:58:48,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 10:58:48,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 10:58:48,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 10:58:48,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +49: [2023-04-29 10:58:48,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +49: [2023-04-29 10:58:48,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:48,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 10:58:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 10:58:48,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +38: [2023-04-29 10:58:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 10:58:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:48,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 10:58:48,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:48,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 10:58:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 10:58:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 10:58:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +60: [2023-04-29 10:58:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 10:58:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 10:58:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 10:58:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 10:58:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 10:58:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 10:58:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:48,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:48,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 10:58:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:48,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 10:58:48,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 10:58:48,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 10:58:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:48,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 10:58:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 10:58:48,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 10:58:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 10:58:48,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 10:58:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:48,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 10:58:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +25: [2023-04-29 10:58:48,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 10:58:48,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 10:58:48,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +20: [2023-04-29 10:58:48,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +25: [2023-04-29 10:58:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +43: [2023-04-29 10:58:48,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 10:58:48,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 10:58:48,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 10:58:48,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 10:58:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:48,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 10:58:48,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:48,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 10:58:48,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 10:58:48,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +17: [2023-04-29 10:58:48,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 10:58:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +17: [2023-04-29 10:58:48,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +58: [2023-04-29 10:58:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:48,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 10:58:48,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 10:58:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 10:58:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +44: [2023-04-29 10:58:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 10:58:48,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:48,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 10:58:48,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:48,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +18: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +18: [2023-04-29 10:58:48,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 10:58:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +25: [2023-04-29 10:58:48,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:48,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 10:58:48,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +28: [2023-04-29 10:58:48,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 10:58:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 10:58:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 10:58:48,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 10:58:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +49: [2023-04-29 10:58:48,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +44: [2023-04-29 10:58:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 10:58:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 10:58:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 10:58:48,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 10:58:48,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 10:58:48,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 10:58:48,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 10:58:48,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +42: [2023-04-29 10:58:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 10:58:48,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 10:58:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +62: [2023-04-29 10:58:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 10:58:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 10:58:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +42: [2023-04-29 10:58:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +11: [2023-04-29 10:58:48,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +11: [2023-04-29 10:58:48,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 10:58:48,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +42: [2023-04-29 10:58:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +28: [2023-04-29 10:58:48,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 6: [2023-04-29 10:58:48,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +58: [2023-04-29 10:58:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +27: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +27: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 10:58:48,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 10:58:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +27: [2023-04-29 10:58:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 10:58:48,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 6: [2023-04-29 10:58:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 10:58:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +29: [2023-04-29 10:58:48,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 10:58:48,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 10:58:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 10:58:48,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 10:58:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +29: [2023-04-29 10:58:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 10:58:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +58: [2023-04-29 10:58:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +22: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +44: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 10:58:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 10:58:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 10:58:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 10:58:48,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +17: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 10:58:48,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 10:58:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 10:58:48,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +58: [2023-04-29 10:58:48,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:48,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 10:58:48,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 10:58:48,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 10:58:48,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 10:58:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 10:58:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 10:58:48,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:48,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 10:58:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 10:58:48,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 10:58:48,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +25: [2023-04-29 10:58:48,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 10:58:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +25: [2023-04-29 10:58:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +25: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 10:58:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 10:58:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 10:58:48,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +31: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +41: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +31: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +41: [2023-04-29 10:58:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +17: [2023-04-29 10:58:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +17: [2023-04-29 10:58:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 10:58:48,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +41: [2023-04-29 10:58:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 10:58:48,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +18: [2023-04-29 10:58:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 10:58:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 10:58:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +30: [2023-04-29 10:58:48,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 10:58:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +30: [2023-04-29 10:58:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 10:58:48,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 10:58:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 10:58:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 10:58:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 10:58:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 10:58:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 10:58:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +13: [2023-04-29 10:58:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +13: [2023-04-29 10:58:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +13: [2023-04-29 10:58:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +13: [2023-04-29 10:58:48,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +36: [2023-04-29 10:58:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 10:58:48,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 10:58:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 10:58:48,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 10:58:48,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 10:58:48,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 10:58:48,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 10:58:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +11: [2023-04-29 10:58:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:48,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:48,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 10:58:48,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 10:58:48,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 10:58:48,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 10:58:48,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +44: [2023-04-29 10:58:48,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +28: [2023-04-29 10:58:48,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:48,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 10:58:48,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 10:58:48,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 10:58:48,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:48,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +52: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +52: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +52: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +52: [2023-04-29 10:58:48,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +42: [2023-04-29 10:58:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +37: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 10:58:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +62: [2023-04-29 10:58:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +42: [2023-04-29 10:58:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 10:58:48,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 10:58:48,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 10:58:48,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:48,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 10:58:48,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 10:58:48,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +41: [2023-04-29 10:58:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 10:58:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 10:58:48,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +12: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 10:58:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +17: [2023-04-29 10:58:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +37: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +13: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +52: [2023-04-29 10:58:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 10:58:48,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +12: [2023-04-29 10:58:48,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 10:58:48,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 10:58:48,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +37: [2023-04-29 10:58:48,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:48,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +52: [2023-04-29 10:58:48,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:48,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 10:58:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 10:58:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +21: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +32: [2023-04-29 10:58:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 10:58:48,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 10:58:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 10:58:48,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 10:58:48,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +41: [2023-04-29 10:58:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 10:58:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +32: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 10:58:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 10:58:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +32: [2023-04-29 10:58:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +29: [2023-04-29 10:58:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 10:58:48,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 10:58:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +61: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +61: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 10:58:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +46: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +61: [2023-04-29 10:58:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 10:58:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 10:58:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 10:58:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 10:58:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 10:58:48,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 10:58:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 10:58:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +46: [2023-04-29 10:58:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 10:58:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +46: [2023-04-29 10:58:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 10:58:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 10:58:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:48,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 10:58:48,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +41: [2023-04-29 10:58:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 10:58:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:48,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 10:58:48,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 10:58:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +12: [2023-04-29 10:58:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 10:58:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 10:58:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 10:58:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 10:58:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +12: [2023-04-29 10:58:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 10:58:48,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 10:58:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 10:58:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 10:58:48,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +30: [2023-04-29 10:58:48,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 10:58:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +26: [2023-04-29 10:58:48,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 10:58:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 10:58:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +13: [2023-04-29 10:58:48,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +45: [2023-04-29 10:58:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 10:58:48,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 10:58:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 10:58:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 10:58:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +13: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +45: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +27: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +45: [2023-04-29 10:58:48,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:48,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +13: [2023-04-29 10:58:48,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +52: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +52: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +52: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +45: [2023-04-29 10:58:48,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 10:58:48,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 10:58:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:48,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:48,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 10:58:48,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 10:58:48,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 10:58:48,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +30: [2023-04-29 10:58:48,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 10:58:48,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +54: [2023-04-29 10:58:48,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:48,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 10:58:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 10:58:48,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 10:58:48,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +54: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +54: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 10:58:48,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:48,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 10:58:48,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 10:58:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 10:58:48,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +52: [2023-04-29 10:58:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +14: [2023-04-29 10:58:48,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:48,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 10:58:48,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 10:58:48,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 10:58:48,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +27: [2023-04-29 10:58:48,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +46: [2023-04-29 10:58:48,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 10:58:48,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 10:58:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 10:58:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +45: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt... +45: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 10:58:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +46: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +32: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 10:58:48,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +24: [2023-04-29 10:58:48,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 10:58:48,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 10:58:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +27: [2023-04-29 10:58:48,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +61: [2023-04-29 10:58:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 10:58:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:48,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 10:58:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 10:58:48,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 10:58:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +16: [2023-04-29 10:58:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +16: [2023-04-29 10:58:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +16: [2023-04-29 10:58:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +46: [2023-04-29 10:58:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 10:58:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +20: [2023-04-29 10:58:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +16: [2023-04-29 10:58:48,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 10:58:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +20: [2023-04-29 10:58:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +46: [2023-04-29 10:58:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +13: [2023-04-29 10:58:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 10:58:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 10:58:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 10:58:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 10:58:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 10:58:48,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +61: [2023-04-29 10:58:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 10:58:48,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +32: [2023-04-29 10:58:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 10:58:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:48,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:48,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +19: [2023-04-29 10:58:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +45: [2023-04-29 10:58:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:48,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +19: [2023-04-29 10:58:48,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 10:58:48,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +52: [2023-04-29 10:58:48,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 10:58:48,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 10:58:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 10:58:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 10:58:48,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +30: [2023-04-29 10:58:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 10:58:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 10:58:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 10:58:48,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +30: [2023-04-29 10:58:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 10:58:48,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +22: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +37: [2023-04-29 10:58:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +50: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +37: [2023-04-29 10:58:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +16: [2023-04-29 10:58:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 10:58:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +16: [2023-04-29 10:58:48,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 10:58:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +55: [2023-04-29 10:58:48,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 10:58:48,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 10:58:48,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +46: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +46: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +46: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +21: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 10:58:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +21: [2023-04-29 10:58:48,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 10:58:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 10:58:48,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 10:58:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 10:58:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 10:58:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 10:58:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 10:58:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 10:58:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 10:58:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +36: [2023-04-29 10:58:48,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 10:58:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 10:58:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +45: [2023-04-29 10:58:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 10:58:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +36: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +34: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 10:58:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 10:58:48,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 10:58:48,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 10:58:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 10:58:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 10:58:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 10:58:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 10:58:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 10:58:48,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 10:58:48,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 10:58:48,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:48,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:48,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +46: [2023-04-29 10:58:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +46: [2023-04-29 10:58:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +39: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +39: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 10:58:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +36: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +18: [2023-04-29 10:58:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +18: [2023-04-29 10:58:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +35: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +45: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +57: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +47: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +47: [2023-04-29 10:58:48,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 10:58:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 10:58:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:48,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:48,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +15: [2023-04-29 10:58:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +34: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 10:58:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +38: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +35: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +15: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 10:58:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +15: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +15: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 10:58:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 10:58:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 10:58:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 10:58:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:48,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +53: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +53: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +53: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 10:58:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +33: [2023-04-29 10:58:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:48,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +32: [2023-04-29 10:58:48,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +32: [2023-04-29 10:58:48,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +32: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +16: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 10:58:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 10:58:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +33: [2023-04-29 10:58:48,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +51: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +62: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +51: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 10:58:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +47: [2023-04-29 10:58:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:48,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +50: [2023-04-29 10:58:48,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 10:58:48,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 10:58:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 10:58:48,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 10:58:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 10:58:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 10:58:48,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 10:58:48,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 10:58:48,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +25: [2023-04-29 10:58:48,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +56: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +25: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +56: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:48,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 10:58:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 10:58:48,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 10:58:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 10:58:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:48,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +48: [2023-04-29 10:58:48,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +63: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:48,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +59: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +59: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 6: [2023-04-29 10:58:48,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 9: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +53: [2023-04-29 10:58:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +23: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... + 1: [2023-04-29 10:58:48,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 10:58:48,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 1: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +41: [2023-04-29 10:58:48,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:48,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +43: [2023-04-29 10:58:48,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 10:58:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 10:58:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 10:58:48,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 10:58:48,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +16: [2023-04-29 10:58:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 10:58:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +57: [2023-04-29 10:58:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 10:58:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:48,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +46: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 10:58:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:48,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +41: [2023-04-29 10:58:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +41: [2023-04-29 10:58:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +57: [2023-04-29 10:58:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +25: [2023-04-29 10:58:48,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +41: [2023-04-29 10:58:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 10:58:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 10:58:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +16: [2023-04-29 10:58:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +16: [2023-04-29 10:58:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +16: [2023-04-29 10:58:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +16: [2023-04-29 10:58:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:48,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +21: [2023-04-29 10:58:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 10:58:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +46: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +35: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 10:58:48,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 10:58:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:48,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:48,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 10:58:48,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:48,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:48,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +46: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +34: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +38: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 10:58:48,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 10:58:48,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +34: [2023-04-29 10:58:48,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 6: [2023-04-29 10:58:48,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 10:58:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +15: [2023-04-29 10:58:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +17: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +57: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +17: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +43: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +34: [2023-04-29 10:58:48,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 10:58:48,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 10:58:48,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 10:58:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +34: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +11: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 10:58:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +43: [2023-04-29 10:58:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 10:58:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +15: [2023-04-29 10:58:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +42: [2023-04-29 10:58:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 10:58:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 10:58:48,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 10:58:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +15: [2023-04-29 10:58:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +38: [2023-04-29 10:58:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 10:58:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 10:58:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 10:58:48,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:48,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 10:58:48,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 10:58:48,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:48,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 10:58:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 10:58:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:48,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +47: [2023-04-29 10:58:48,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 10:58:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +39: [2023-04-29 10:58:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +47: [2023-04-29 10:58:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +56: [2023-04-29 10:58:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 10:58:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 10:58:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +17: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 10:58:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +17: [2023-04-29 10:58:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 10:58:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 10:58:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 10:58:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 10:58:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +56: [2023-04-29 10:58:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 10:58:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +53: [2023-04-29 10:58:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +32: [2023-04-29 10:58:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 10:58:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 10:58:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 10:58:48,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 10:58:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +58: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +11: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +32: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +63: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +53: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 10:58:48,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +55: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 10:58:48,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +62: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +62: [2023-04-29 10:58:48,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 10:58:48,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:48,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 10:58:48,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 10:58:48,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +58: [2023-04-29 10:58:48,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 10:58:48,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 10:58:48,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:48,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:48,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +62: [2023-04-29 10:58:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:48,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +44: [2023-04-29 10:58:48,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +44: [2023-04-29 10:58:48,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +32: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 10:58:48,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +62: [2023-04-29 10:58:48,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:48,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 10:58:48,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 10:58:48,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 10:58:48,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 10:58:48,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +52: [2023-04-29 10:58:48,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 10:58:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +32: [2023-04-29 10:58:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +32: [2023-04-29 10:58:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +26: [2023-04-29 10:58:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +33: [2023-04-29 10:58:48,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 10:58:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +32: [2023-04-29 10:58:48,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 10:58:48,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 10:58:48,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +60: [2023-04-29 10:58:48,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +60: [2023-04-29 10:58:48,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 10:58:48,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:48,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:48,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:48,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 10:58:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +59: [2023-04-29 10:58:48,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 10:58:48,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 10:58:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 10:58:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 10:58:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +27: [2023-04-29 10:58:48,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +27: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +59: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 1: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 10:58:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 0: [2023-04-29 10:58:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 10:58:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 10:58:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 10:58:48,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:48,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:48,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 10:58:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:48,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 10:58:48,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +62: [2023-04-29 10:58:48,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 10:58:48,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 10:58:48,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 10:58:48,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +28: [2023-04-29 10:58:48,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 10:58:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 10:58:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +28: [2023-04-29 10:58:48,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +39: [2023-04-29 10:58:48,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:48,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +33: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +12: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 10:58:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +49: [2023-04-29 10:58:48,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 10:58:48,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 10:58:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 10:58:48,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 10:58:48,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +37: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +37: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +36: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +37: [2023-04-29 10:58:48,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +49: [2023-04-29 10:58:48,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 10:58:48,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 10:58:48,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 10:58:48,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +60: [2023-04-29 10:58:48,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 10:58:48,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:48,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:48,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 10:58:48,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 10:58:48,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 10:58:48,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:48,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 10:58:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 10:58:48,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +35: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +14: [2023-04-29 10:58:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. +49: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +54: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +14: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 10:58:48,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +61: [2023-04-29 10:58:48,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. +60: [2023-04-29 10:58:48,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:48,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 10:58:48,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 10:58:48,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 10:58:48,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +54: [2023-04-29 10:58:48,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 10:58:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +35: [2023-04-29 10:58:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 10:58:48,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:48,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +28: [2023-04-29 10:58:48,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 10:58:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 5: [2023-04-29 10:58:48,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 10:58:48,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 10:58:48,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +13: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +13: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 10:58:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +28: [2023-04-29 10:58:48,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 10:58:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 10:58:48,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 10:58:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 10:58:48,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:48,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:48,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 10:58:48,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 10:58:48,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 10:58:48,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:48,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:48,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +41: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 10:58:48,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:48,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 10:58:48,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 10:58:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 10:58:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 10:58:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:48,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 10:58:48,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 10:58:48,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +19: [2023-04-29 10:58:48,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +49: [2023-04-29 10:58:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:48,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 10:58:48,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 10:58:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +62: [2023-04-29 10:58:48,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 10:58:48,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +39: [2023-04-29 10:58:48,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +32: [2023-04-29 10:58:48,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:48,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:48,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +45: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +47: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +10: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +31: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 10:58:48,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:48,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +60: [2023-04-29 10:58:48,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +49: [2023-04-29 10:58:48,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 10:58:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +42: [2023-04-29 10:58:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +42: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +49: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +59: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 10:58:48,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:48,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 10:58:48,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:48,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +62: [2023-04-29 10:58:48,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +10: [2023-04-29 10:58:48,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +10: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +39: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +49: [2023-04-29 10:58:48,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +59: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +10: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 10:58:48,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 10:58:48,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:48,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 10:58:48,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 10:58:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 10:58:48,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 10:58:48,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 5: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +30: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +54: [2023-04-29 10:58:48,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +47: [2023-04-29 10:58:48,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +60: [2023-04-29 10:58:48,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +39: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:48,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +40: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +20: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +37: [2023-04-29 10:58:48,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 10:58:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 10:58:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +37: [2023-04-29 10:58:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +54: [2023-04-29 10:58:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +47: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 10:58:48,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:48,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +20: [2023-04-29 10:58:48,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 10:58:48,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 10:58:48,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +24: [2023-04-29 10:58:48,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +24: [2023-04-29 10:58:48,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:48,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:48,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 10:58:48,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 10:58:48,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:48,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:48,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 10:58:48,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 10:58:48,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:48,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:48,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:48,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 10:58:48,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:48,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:48,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 3: [2023-04-29 10:58:48,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +41: [2023-04-29 10:58:48,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:48,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 10:58:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +61: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +16: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:48,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:48,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 10:58:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 10:58:48,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:48,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... +61: [2023-04-29 10:58:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt... + 2: [2023-04-29 10:58:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +55: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 7: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +20: [2023-04-29 10:58:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +55: [2023-04-29 10:58:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +55: [2023-04-29 10:58:48,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:48,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 10:58:48,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 10:58:48,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 10:58:48,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 10:58:48,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +57: [2023-04-29 10:58:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +41: [2023-04-29 10:58:48,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:48,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +41: [2023-04-29 10:58:48,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:48,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +36: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 10:58:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 10:58:48,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +16: [2023-04-29 10:58:48,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 10:58:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 10:58:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:48,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +35: [2023-04-29 10:58:48,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 10:58:48,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +55: [2023-04-29 10:58:48,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 10:58:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 10:58:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 10:58:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 10:58:48,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 10:58:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +31: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 10:58:48,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 10:58:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:48,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +45: [2023-04-29 10:58:48,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:48,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:48,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 10:58:48,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:48,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:48,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +45: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:48,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +29: [2023-04-29 10:58:48,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 10:58:48,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 10:58:48,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 10:58:48,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +36: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 10:58:48,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 10:58:48,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:48,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +45: [2023-04-29 10:58:48,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 10:58:48,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +59: [2023-04-29 10:58:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:48,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +48: [2023-04-29 10:58:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:48,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 10:58:48,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:48,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:48,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:48,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 10:58:48,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:48,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +48: [2023-04-29 10:58:48,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 10:58:48,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:48,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 10:58:48,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +37: [2023-04-29 10:58:48,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 10:58:48,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +59: [2023-04-29 10:58:48,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 10:58:48,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 10:58:48,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 10:58:48,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:48,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:48,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 10:58:48,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:48,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +41: [2023-04-29 10:58:48,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:48,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:48,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 10:58:48,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:48,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 10:58:48,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 10:58:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:48,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 10:58:48,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:48,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:48,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 10:58:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 10:58:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 10:58:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 10:58:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:48,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:48,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 10:58:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 10:58:48,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 10:58:48,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:48,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +33: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:48,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 10:58:48,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 10:58:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +33: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:48,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 8: [2023-04-29 10:58:48,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:48,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +11: [2023-04-29 10:58:48,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +55: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +25: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +25: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +11: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +11: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:48,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +25: [2023-04-29 10:58:48,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 10:58:48,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:48,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:48,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +28: [2023-04-29 10:58:48,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 10:58:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +60: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:48,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +60: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 10:58:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +44: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 10:58:48,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:48,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:48,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 10:58:48,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 10:58:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 10:58:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 10:58:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 10:58:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 10:58:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +44: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +57: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:48,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +14: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +55: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +29: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +55: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:48,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +50: [2023-04-29 10:58:48,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +22: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 10:58:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 10:58:48,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +36: [2023-04-29 10:58:48,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 10:58:48,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 10:58:48,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 10:58:48,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 10:58:48,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 10:58:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +63: [2023-04-29 10:58:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:48,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:48,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:48,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:48,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +17: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +35: [2023-04-29 10:58:48,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +52: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 0: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +52: [2023-04-29 10:58:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 10:58:48,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 10:58:48,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 10:58:48,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 10:58:48,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +54: [2023-04-29 10:58:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +53: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +53: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:48,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 10:58:48,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:48,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 10:58:48,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 10:58:48,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 10:58:48,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 10:58:48,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +41: [2023-04-29 10:58:48,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 10:58:48,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:48,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:48,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:48,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 10:58:48,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 10:58:48,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:48,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 10:58:48,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:48,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 10:58:48,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +53: [2023-04-29 10:58:48,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:48,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:48,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +29: [2023-04-29 10:58:48,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:48,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:48,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +41: [2023-04-29 10:58:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 10:58:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:48,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +43: [2023-04-29 10:58:48,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 10:58:48,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 10:58:48,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 10:58:48,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 10:58:48,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 10:58:48,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 10:58:48,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:48,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 10:58:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 10:58:48,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 10:58:48,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:48,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 10:58:48,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +22: [2023-04-29 10:58:48,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +22: [2023-04-29 10:58:48,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:48,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +40: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 10:58:48,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +25: [2023-04-29 10:58:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:48,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 10:58:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:48,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:48,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:48,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 10:58:48,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:48,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 10:58:48,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:48,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 10:58:48,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:48,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:48,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 10:58:48,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:48,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:48,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 10:58:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +39: [2023-04-29 10:58:48,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +21: [2023-04-29 10:58:48,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +52: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +52: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +52: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +50: [2023-04-29 10:58:48,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +63: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +14: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +63: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +25: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 10:58:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 10:58:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +27: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +47: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:48,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +25: [2023-04-29 10:58:48,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +44: [2023-04-29 10:58:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 10:58:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +33: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +27: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 10:58:48,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +14: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +42: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 10:58:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +27: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 10:58:48,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +50: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +47: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 10:58:48,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 10:58:48,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:48,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 10:58:48,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 10:58:48,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 10:58:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +32: [2023-04-29 10:58:48,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +32: [2023-04-29 10:58:48,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 10:58:48,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +26: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +33: [2023-04-29 10:58:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 10:58:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +15: [2023-04-29 10:58:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 10:58:48,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 10:58:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 10:58:48,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +33: [2023-04-29 10:58:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +26: [2023-04-29 10:58:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +50: [2023-04-29 10:58:48,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 10:58:48,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 10:58:48,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:48,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 10:58:48,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +17: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:48,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 10:58:48,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 10:58:48,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 10:58:48,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 10:58:48,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +15: [2023-04-29 10:58:48,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:48,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +42: [2023-04-29 10:58:48,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +16: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +16: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 10:58:48,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +47: [2023-04-29 10:58:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +47: [2023-04-29 10:58:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 10:58:48,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 10:58:48,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. + 1: [2023-04-29 10:58:48,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 10:58:48,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 10:58:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +38: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +52: [2023-04-29 10:58:48,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:48,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 10:58:48,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 10:58:48,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:48,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 10:58:48,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 10:58:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 10:58:48,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 10:58:48,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:48,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:48,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 10:58:48,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 10:58:48,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 10:58:48,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 10:58:48,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:48,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 10:58:48,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +60: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +12: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 10:58:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 10:58:48,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 10:58:48,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +62: [2023-04-29 10:58:48,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:48,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 10:58:48,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +58: [2023-04-29 10:58:48,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 10:58:48,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +12: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +13: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +12: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +17: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +12: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 10:58:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 10:58:48,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 10:58:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +15: [2023-04-29 10:58:48,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +62: [2023-04-29 10:58:48,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 10:58:48,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 10:58:48,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 10:58:48,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:48,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 10:58:48,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:48,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +51: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +60: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +40: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:48,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +62: [2023-04-29 10:58:48,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 10:58:48,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +56: [2023-04-29 10:58:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +56: [2023-04-29 10:58:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +56: [2023-04-29 10:58:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +62: [2023-04-29 10:58:48,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 6: [2023-04-29 10:58:48,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:48,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 10:58:48,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:48,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:48,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 10:58:48,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 10:58:48,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 10:58:48,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:48,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:48,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:48,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 10:58:48,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +49: [2023-04-29 10:58:48,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +34: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 10:58:48,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +51: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 0: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 10:58:48,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 10:58:48,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +49: [2023-04-29 10:58:48,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +23: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +23: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:48,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:48,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 10:58:48,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 10:58:48,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 10:58:48,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 10:58:48,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +22: [2023-04-29 10:58:48,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 10:58:48,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 10:58:48,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 10:58:48,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 10:58:48,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +58: [2023-04-29 10:58:48,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 10:58:48,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 10:58:48,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 10:58:48,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 10:58:48,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +37: [2023-04-29 10:58:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 10:58:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +37: [2023-04-29 10:58:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:48,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 10:58:48,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:48,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +37: [2023-04-29 10:58:48,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:48,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 10:58:48,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +48: [2023-04-29 10:58:48,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +48: [2023-04-29 10:58:48,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +56: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 10:58:48,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 10:58:48,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 10:58:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:48,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 10:58:48,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 10:58:48,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:48,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:48,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:48,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:48,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:48,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:48,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 10:58:48,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 10:58:48,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 10:58:48,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +34: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +63: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 10:58:48,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 10:58:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 10:58:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +26: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +54: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +54: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +23: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +47: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +46: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 1: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +61: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +38: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 10:58:48,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 10:58:48,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +46: [2023-04-29 10:58:48,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 1: [2023-04-29 10:58:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +46: [2023-04-29 10:58:48,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 10:58:48,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 3: [2023-04-29 10:58:48,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +13: [2023-04-29 10:58:48,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 10:58:48,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 10:58:48,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:48,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +47: [2023-04-29 10:58:48,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:48,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:48,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:48,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:48,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +15: [2023-04-29 10:58:48,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 10:58:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 10:58:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +32: [2023-04-29 10:58:48,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:48,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 10:58:48,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:48,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 10:58:48,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +46: [2023-04-29 10:58:48,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 10:58:48,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 10:58:48,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 10:58:48,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 10:58:48,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 1: [2023-04-29 10:58:49,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:48,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 10:58:48,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:48,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:48,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 10:58:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 10:58:49,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 10:58:49,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 10:58:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 10:58:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 10:58:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 10:58:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:49,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 10:58:49,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:49,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +12: [2023-04-29 10:58:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 10:58:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +39: [2023-04-29 10:58:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:49,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 10:58:49,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 10:58:49,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 10:58:49,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 10:58:49,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +16: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 10:58:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +56: [2023-04-29 10:58:49,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:49,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:49,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 10:58:49,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 10:58:49,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 10:58:49,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 10:58:49,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:49,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 10:58:49,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 10:58:49,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 10:58:49,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +26: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:49,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 10:58:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +13: [2023-04-29 10:58:49,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 10:58:49,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 1: [2023-04-29 10:58:49,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 10:58:49,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:49,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 10:58:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +12: [2023-04-29 10:58:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 10:58:49,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:49,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:49,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:49,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +58: [2023-04-29 10:58:49,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 10:58:49,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +37: [2023-04-29 10:58:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +51: [2023-04-29 10:58:49,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:49,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:49,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +12: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 10:58:49,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 10:58:49,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 10:58:49,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +12: [2023-04-29 10:58:49,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +37: [2023-04-29 10:58:49,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +13: [2023-04-29 10:58:49,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 10:58:49,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:49,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 10:58:49,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:49,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:49,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 10:58:49,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 10:58:49,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +53: [2023-04-29 10:58:49,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 10:58:49,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:49,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:49,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +37: [2023-04-29 10:58:49,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 10:58:49,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +14: [2023-04-29 10:58:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +14: [2023-04-29 10:58:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +56: [2023-04-29 10:58:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 10:58:49,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt. +49: [2023-04-29 10:58:49,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +36: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +36: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +36: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 10:58:49,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 10:58:49,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:49,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:49,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 10:58:49,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 10:58:49,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 10:58:49,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:49,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +37: [2023-04-29 10:58:49,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +20: [2023-04-29 10:58:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +53: [2023-04-29 10:58:49,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +33: [2023-04-29 10:58:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 10:58:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 10:58:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 10:58:49,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 10:58:49,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 10:58:49,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 10:58:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 10:58:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 10:58:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 10:58:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +20: [2023-04-29 10:58:49,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +56: [2023-04-29 10:58:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 10:58:49,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 10:58:49,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:49,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 10:58:49,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:49,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:49,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:49,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 10:58:49,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 10:58:49,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 10:58:49,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt. +60: [2023-04-29 10:58:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 10:58:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +61: [2023-04-29 10:58:49,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 10:58:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +56: [2023-04-29 10:58:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +14: [2023-04-29 10:58:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 10:58:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 10:58:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +14: [2023-04-29 10:58:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 10:58:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 10:58:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 10:58:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 10:58:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 10:58:49,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:49,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:49,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 10:58:49,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:49,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +33: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 10:58:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:49,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:49,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 10:58:49,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 10:58:49,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:49,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 10:58:49,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 10:58:49,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 10:58:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:49,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 10:58:49,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 10:58:49,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 10:58:49,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:49,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 10:58:49,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +61: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +23: [2023-04-29 10:58:49,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 10:58:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 10:58:49,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 10:58:49,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +23: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +23: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 10:58:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 10:58:49,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +57: [2023-04-29 10:58:49,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:49,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:49,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +34: [2023-04-29 10:58:49,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 10:58:49,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 10:58:49,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 10:58:49,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:49,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 10:58:49,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 10:58:49,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 10:58:49,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 10:58:49,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +59: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +41: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +40: [2023-04-29 10:58:49,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 10:58:49,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:49,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 10:58:49,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:49,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:49,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +45: [2023-04-29 10:58:49,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 10:58:49,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 10:58:49,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 10:58:49,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +45: [2023-04-29 10:58:49,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +53: [2023-04-29 10:58:49,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 10:58:49,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +20: [2023-04-29 10:58:49,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +60: [2023-04-29 10:58:49,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:49,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 10:58:49,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:49,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 10:58:49,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 10:58:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 10:58:49,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:49,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:49,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 10:58:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 10:58:49,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +60: [2023-04-29 10:58:49,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 10:58:49,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:49,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:49,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 10:58:49,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 10:58:49,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 10:58:49,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 10:58:49,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 10:58:49,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:49,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 10:58:49,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:49,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 10:58:49,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +31: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +33: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +35: [2023-04-29 10:58:49,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +31: [2023-04-29 10:58:49,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 10:58:49,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 10:58:49,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 10:58:49,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 10:58:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 10:58:49,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +33: [2023-04-29 10:58:49,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 10:58:49,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 10:58:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 10:58:49,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +60: [2023-04-29 10:58:49,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 10:58:49,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 10:58:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 10:58:49,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +40: [2023-04-29 10:58:49,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +50: [2023-04-29 10:58:49,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:49,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 10:58:49,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +35: [2023-04-29 10:58:49,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 10:58:49,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:49,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +50: [2023-04-29 10:58:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:49,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +40: [2023-04-29 10:58:49,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 10:58:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 10:58:49,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:49,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt. +31: [2023-04-29 10:58:49,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 10:58:49,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 10:58:49,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +40: [2023-04-29 10:58:49,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +40: [2023-04-29 10:58:49,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 10:58:49,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 10:58:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +40: [2023-04-29 10:58:49,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 10:58:49,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:49,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 10:58:49,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 10:58:49,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +19: [2023-04-29 10:58:49,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 10:58:49,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:49,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 10:58:49,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +34: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +14: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +34: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +24: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +40: [2023-04-29 10:58:49,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +40: [2023-04-29 10:58:49,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 10:58:49,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt... +40: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 10:58:49,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:49,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 10:58:49,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:49,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +19: [2023-04-29 10:58:49,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +41: [2023-04-29 10:58:49,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:49,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:49,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:49,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 10:58:49,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +60: [2023-04-29 10:58:49,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:49,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 10:58:49,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +19: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 10:58:49,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:49,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +57: [2023-04-29 10:58:49,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:49,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:49,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:49,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 10:58:49,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 10:58:49,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +60: [2023-04-29 10:58:49,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:49,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 10:58:49,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 10:58:49,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:49,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:49,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:49,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:49,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:49,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +50: [2023-04-29 10:58:49,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 10:58:49,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 10:58:49,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +43: [2023-04-29 10:58:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +43: [2023-04-29 10:58:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +31: [2023-04-29 10:58:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +43: [2023-04-29 10:58:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +60: [2023-04-29 10:58:49,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:49,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 10:58:49,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 9: [2023-04-29 10:58:49,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +60: [2023-04-29 10:58:49,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +17: [2023-04-29 10:58:49,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:49,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:49,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +40: [2023-04-29 10:58:49,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:49,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +40: [2023-04-29 10:58:49,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 10:58:49,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:49,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 10:58:49,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 10:58:49,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 10:58:49,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:49,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +50: [2023-04-29 10:58:49,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:49,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 10:58:49,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:49,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +43: [2023-04-29 10:58:49,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:49,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:49,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:49,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 10:58:49,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 10:58:49,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 10:58:49,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +50: [2023-04-29 10:58:49,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 10:58:49,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:49,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +14: [2023-04-29 10:58:49,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 10:58:49,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:49,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 10:58:49,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 10:58:49,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 10:58:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 10:58:49,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:49,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +31: [2023-04-29 10:58:49,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 10:58:49,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +53: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 10:58:49,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +53: [2023-04-29 10:58:49,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:49,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 10:58:49,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 10:58:49,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +40: [2023-04-29 10:58:49,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 10:58:49,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 10:58:49,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 10:58:49,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 10:58:49,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:49,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:49,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 10:58:49,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:49,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 10:58:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 10:58:49,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +28: [2023-04-29 10:58:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 10:58:49,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 10:58:49,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 10:58:49,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:49,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +31: [2023-04-29 10:58:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:49,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 10:58:49,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:49,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:49,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:49,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +53: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:49,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:49,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:49,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +46: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +46: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +46: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +46: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +11: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +11: [2023-04-29 10:58:49,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +44: [2023-04-29 10:58:49,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +44: [2023-04-29 10:58:49,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +44: [2023-04-29 10:58:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +44: [2023-04-29 10:58:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 10:58:49,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +11: [2023-04-29 10:58:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 10:58:49,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:49,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +16: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +16: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 10:58:49,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 10:58:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +46: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +17: [2023-04-29 10:58:49,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +46: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:49,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +18: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +18: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +44: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 6: [2023-04-29 10:58:49,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +11: [2023-04-29 10:58:49,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +44: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 6: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 10:58:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 10:58:49,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +26: [2023-04-29 10:58:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +26: [2023-04-29 10:58:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 10:58:49,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 10:58:49,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:49,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 10:58:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +30: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:49,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +38: [2023-04-29 10:58:49,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +38: [2023-04-29 10:58:49,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +38: [2023-04-29 10:58:49,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +28: [2023-04-29 10:58:49,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 10:58:49,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 10:58:49,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:49,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:49,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:49,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +38: [2023-04-29 10:58:49,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:49,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:49,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 10:58:49,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 10:58:49,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:49,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 10:58:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 10:58:49,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +46: [2023-04-29 10:58:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 10:58:49,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 10:58:49,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:49,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:49,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 10:58:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 10:58:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +46: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +24: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 10:58:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +39: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +39: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +11: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +11: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +11: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 10:58:49,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 10:58:49,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:49,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:49,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +11: [2023-04-29 10:58:49,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 10:58:49,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +46: [2023-04-29 10:58:49,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +30: [2023-04-29 10:58:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +11: [2023-04-29 10:58:49,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +46: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +22: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +30: [2023-04-29 10:58:49,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +12: [2023-04-29 10:58:49,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:49,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 10:58:49,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 10:58:49,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +10: [2023-04-29 10:58:49,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 10:58:49,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:49,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 10:58:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:49,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 10:58:49,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 10:58:49,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 10:58:49,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 10:58:49,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 10:58:49,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 4: [2023-04-29 10:58:49,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +30: [2023-04-29 10:58:49,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +17: [2023-04-29 10:58:49,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +30: [2023-04-29 10:58:49,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 10:58:49,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +17: [2023-04-29 10:58:49,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 10:58:49,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 10:58:49,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 10:58:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 10:58:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +22: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +25: [2023-04-29 10:58:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +17: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +17: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 10:58:49,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 10:58:49,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +22: [2023-04-29 10:58:49,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 10:58:49,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:49,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +18: [2023-04-29 10:58:49,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 10:58:49,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:49,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 10:58:49,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +38: [2023-04-29 10:58:49,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 10:58:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 10:58:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 10:58:49,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +62: [2023-04-29 10:58:49,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 10:58:49,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +26: [2023-04-29 10:58:49,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +62: [2023-04-29 10:58:49,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 10:58:49,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +10: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +63: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 10:58:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +18: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +27: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 10:58:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +38: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +29: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 10:58:49,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +16: [2023-04-29 10:58:49,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 10:58:49,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +12: [2023-04-29 10:58:49,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 10:58:49,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:49,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +29: [2023-04-29 10:58:49,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 4: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 10:58:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 10:58:49,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +52: [2023-04-29 10:58:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +52: [2023-04-29 10:58:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +52: [2023-04-29 10:58:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +52: [2023-04-29 10:58:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +13: [2023-04-29 10:58:49,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 10:58:49,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 10:58:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 10:58:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 10:58:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 10:58:49,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 10:58:49,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +63: [2023-04-29 10:58:49,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 10:58:49,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +62: [2023-04-29 10:58:49,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 10:58:49,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 10:58:49,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:49,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:49,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:49,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:49,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 10:58:49,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 10:58:49,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 10:58:49,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:49,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 10:58:49,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 10:58:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:49,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 10:58:49,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:49,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:49,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 10:58:49,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 10:58:49,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 10:58:49,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 10:58:49,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 10:58:49,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 10:58:49,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:49,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 10:58:49,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 10:58:49,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:49,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:49,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +39: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +24: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 10:58:49,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +52: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 5: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 10:58:49,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:49,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 5: [2023-04-29 10:58:49,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:49,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 10:58:49,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +26: [2023-04-29 10:58:49,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 10:58:49,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 10:58:49,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 10:58:49,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:49,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:49,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 10:58:49,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 10:58:49,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 10:58:49,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 10:58:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 10:58:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 10:58:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 10:58:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 10:58:49,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +42: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +42: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +26: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +42: [2023-04-29 10:58:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +42: [2023-04-29 10:58:49,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +14: [2023-04-29 10:58:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 10:58:49,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 10:58:49,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +15: [2023-04-29 10:58:49,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:49,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 10:58:49,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +15: [2023-04-29 10:58:49,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +15: [2023-04-29 10:58:49,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +25: [2023-04-29 10:58:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 10:58:49,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:49,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 10:58:49,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 10:58:49,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 10:58:49,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 10:58:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 10:58:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:49,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:49,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:49,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +21: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +63: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +21: [2023-04-29 10:58:49,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +21: [2023-04-29 10:58:49,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +63: [2023-04-29 10:58:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 10:58:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 10:58:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 10:58:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 10:58:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 10:58:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:49,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:49,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 10:58:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:49,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 10:58:49,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +25: [2023-04-29 10:58:49,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 10:58:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +51: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 10:58:49,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:49,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +42: [2023-04-29 10:58:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 10:58:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 10:58:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 10:58:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 10:58:49,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +59: [2023-04-29 10:58:49,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 10:58:49,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 10:58:49,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 10:58:49,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +19: [2023-04-29 10:58:49,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:49,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 10:58:49,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 10:58:49,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 10:58:49,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +19: [2023-04-29 10:58:49,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 10:58:49,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 10:58:49,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:49,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:49,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +42: [2023-04-29 10:58:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:49,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 10:58:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 10:58:49,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 10:58:49,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +32: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +14: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 10:58:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +32: [2023-04-29 10:58:49,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 10:58:49,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 10:58:49,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 10:58:49,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +23: [2023-04-29 10:58:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 10:58:49,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 10:58:49,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 10:58:49,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 10:58:49,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +14: [2023-04-29 10:58:49,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 10:58:49,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +57: [2023-04-29 10:58:49,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +12: [2023-04-29 10:58:49,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 10:58:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +49: [2023-04-29 10:58:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +49: [2023-04-29 10:58:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +23: [2023-04-29 10:58:49,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +49: [2023-04-29 10:58:49,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 10:58:49,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:49,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 10:58:49,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:49,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:49,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +42: [2023-04-29 10:58:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 10:58:49,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:49,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +12: [2023-04-29 10:58:49,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 10:58:49,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 10:58:49,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:49,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +23: [2023-04-29 10:58:49,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +23: [2023-04-29 10:58:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:49,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +42: [2023-04-29 10:58:49,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 10:58:49,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:49,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 10:58:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 10:58:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +32: [2023-04-29 10:58:49,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:49,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 10:58:49,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 10:58:49,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 10:58:49,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 10:58:49,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +42: [2023-04-29 10:58:49,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 10:58:49,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 10:58:49,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 10:58:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 10:58:49,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 10:58:49,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +48: [2023-04-29 10:58:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 10:58:49,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 1: [2023-04-29 10:58:49,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 1: [2023-04-29 10:58:49,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 10:58:49,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +63: [2023-04-29 10:58:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 10:58:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 10:58:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 10:58:49,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 10:58:49,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 10:58:49,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +42: [2023-04-29 10:58:49,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 10:58:49,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +56: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:49,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:49,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:49,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:49,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +42: [2023-04-29 10:58:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 10:58:49,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +51: [2023-04-29 10:58:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 10:58:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 10:58:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +59: [2023-04-29 10:58:49,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 10:58:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:49,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 10:58:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 10:58:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +14: [2023-04-29 10:58:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 3: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 10:58:49,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 10:58:49,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 10:58:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:49,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +59: [2023-04-29 10:58:49,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 10:58:49,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 10:58:49,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +59: [2023-04-29 10:58:49,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 10:58:49,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 10:58:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +59: [2023-04-29 10:58:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +57: [2023-04-29 10:58:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +25: [2023-04-29 10:58:49,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 10:58:49,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 10:58:49,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 10:58:49,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 10:58:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 10:58:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 10:58:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 10:58:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 10:58:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +51: [2023-04-29 10:58:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +56: [2023-04-29 10:58:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:49,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 10:58:49,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 10:58:49,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 10:58:49,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 10:58:49,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:49,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:49,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 10:58:49,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 10:58:49,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +57: [2023-04-29 10:58:49,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 10:58:49,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:49,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +34: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +34: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 5: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 10:58:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +31: [2023-04-29 10:58:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 10:58:49,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 10:58:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:49,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:49,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:49,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 10:58:49,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 10:58:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 10:58:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:49,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +47: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:49,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +49: [2023-04-29 10:58:49,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 10:58:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:49,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:49,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:49,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +58: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +17: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 10:58:49,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 10:58:49,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 10:58:49,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +31: [2023-04-29 10:58:49,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:49,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +20: [2023-04-29 10:58:49,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 10:58:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 10:58:49,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 10:58:49,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +23: [2023-04-29 10:58:49,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 10:58:49,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 10:58:49,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 10:58:49,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 10:58:49,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +41: [2023-04-29 10:58:49,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:49,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +34: [2023-04-29 10:58:49,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +34: [2023-04-29 10:58:49,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 10:58:49,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +41: [2023-04-29 10:58:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:49,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 10:58:49,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 10:58:49,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:49,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 10:58:49,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:49,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 10:58:49,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 10:58:49,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 10:58:49,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 1: [2023-04-29 10:58:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 1: [2023-04-29 10:58:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +33: [2023-04-29 10:58:49,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 10:58:49,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:49,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 10:58:49,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 10:58:49,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:49,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:49,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:49,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:49,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:49,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:49,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 10:58:49,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:49,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:49,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:49,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:49,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:49,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +31: [2023-04-29 10:58:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 10:58:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:49,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:49,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 10:58:49,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:49,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:49,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +56: [2023-04-29 10:58:49,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 10:58:49,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:49,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 10:58:49,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 10:58:49,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 10:58:49,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 10:58:49,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +35: [2023-04-29 10:58:49,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 10:58:49,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 10:58:49,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 10:58:49,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 10:58:49,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 10:58:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +53: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +53: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +28: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +29: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:49,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:49,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:49,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +44: [2023-04-29 10:58:49,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 10:58:49,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +29: [2023-04-29 10:58:49,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 10:58:49,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 10:58:49,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 10:58:49,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:49,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 10:58:49,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:49,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:49,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +17: [2023-04-29 10:58:49,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +58: [2023-04-29 10:58:49,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +58: [2023-04-29 10:58:49,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +17: [2023-04-29 10:58:49,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 10:58:49,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 10:58:49,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +34: [2023-04-29 10:58:49,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 10:58:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 10:58:49,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 10:58:49,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 10:58:49,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +47: [2023-04-29 10:58:49,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:49,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:49,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:49,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:49,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +35: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 10:58:49,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 10:58:49,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 10:58:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +47: [2023-04-29 10:58:49,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 10:58:49,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 10:58:49,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +30: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:49,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 10:58:49,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 10:58:49,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 10:58:49,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:49,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +30: [2023-04-29 10:58:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 10:58:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 10:58:49,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 10:58:49,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 10:58:49,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 10:58:49,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:49,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +35: [2023-04-29 10:58:49,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:49,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 10:58:49,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 10:58:49,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 10:58:49,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 10:58:49,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +17: [2023-04-29 10:58:49,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:49,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:49,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 6: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +15: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +15: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:49,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 10:58:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 10:58:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 7: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +55: [2023-04-29 10:58:49,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:49,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 10:58:49,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:49,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 10:58:49,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 10:58:49,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 10:58:49,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:49,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 10:58:49,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 10:58:49,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:49,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 10:58:49,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +22: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +22: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +33: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 10:58:49,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:49,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 10:58:49,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:49,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +15: [2023-04-29 10:58:49,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:49,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 10:58:49,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +50: [2023-04-29 10:58:49,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 10:58:49,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 10:58:49,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 10:58:49,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +15: [2023-04-29 10:58:49,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:49,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +11: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 10:58:49,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:49,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:49,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 10:58:49,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 10:58:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 10:58:49,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:49,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:49,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:49,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:49,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:49,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 10:58:49,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:49,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 10:58:49,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:49,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +36: [2023-04-29 10:58:49,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 10:58:49,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 10:58:49,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +36: [2023-04-29 10:58:49,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:49,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 10:58:49,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +22: [2023-04-29 10:58:49,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:49,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:49,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 10:58:49,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 10:58:49,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:49,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:49,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 10:58:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 10:58:49,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 10:58:49,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:49,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +50: [2023-04-29 10:58:49,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 10:58:49,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:49,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +50: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:49,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:49,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:49,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 10:58:49,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +58: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:49,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 0: [2023-04-29 10:58:49,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 10:58:49,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 10:58:49,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +53: [2023-04-29 10:58:49,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 10:58:49,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +55: [2023-04-29 10:58:49,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:49,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:49,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:49,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 10:58:49,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:49,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:49,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +45: [2023-04-29 10:58:49,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +45: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +35: [2023-04-29 10:58:49,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:49,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:49,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 10:58:49,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:49,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:49,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 10:58:49,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:49,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:49,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:49,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 10:58:49,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:49,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:49,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:49,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:49,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 10:58:49,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 10:58:49,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 10:58:49,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +30: [2023-04-29 10:58:49,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 10:58:49,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:49,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 10:58:49,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:49,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 10:58:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 10:58:49,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 10:58:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 10:58:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 10:58:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 10:58:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 10:58:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 10:58:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +55: [2023-04-29 10:58:49,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 10:58:49,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:49,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:49,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 10:58:49,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 10:58:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 10:58:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +24: [2023-04-29 10:58:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:49,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 10:58:49,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:49,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 10:58:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 10:58:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +33: [2023-04-29 10:58:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 10:58:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +61: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +61: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +12: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:49,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +33: [2023-04-29 10:58:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +35: [2023-04-29 10:58:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +35: [2023-04-29 10:58:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 7: [2023-04-29 10:58:49,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:49,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:49,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 10:58:49,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 10:58:49,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:49,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:49,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 10:58:49,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 10:58:49,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 10:58:49,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 10:58:49,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 10:58:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 10:58:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:49,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 10:58:49,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 10:58:49,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 10:58:49,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:49,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:49,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:49,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 10:58:49,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 10:58:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 10:58:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +21: [2023-04-29 10:58:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +21: [2023-04-29 10:58:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +21: [2023-04-29 10:58:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:49,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:49,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +37: [2023-04-29 10:58:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 10:58:49,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +37: [2023-04-29 10:58:49,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:49,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 10:58:49,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +56: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:49,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +49: [2023-04-29 10:58:49,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:49,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:49,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:49,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:49,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:49,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +45: [2023-04-29 10:58:49,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:49,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:49,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:49,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:49,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:49,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 10:58:49,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:49,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:49,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 10:58:49,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:49,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:49,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +23: [2023-04-29 10:58:49,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 10:58:49,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 10:58:49,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:49,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:49,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +56: [2023-04-29 10:58:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 10:58:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +23: [2023-04-29 10:58:49,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +45: [2023-04-29 10:58:49,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 10:58:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 4: [2023-04-29 10:58:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:49,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:49,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:49,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:49,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 10:58:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:49,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 10:58:49,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 10:58:49,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:49,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:49,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 10:58:49,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 10:58:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 10:58:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 10:58:49,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +62: [2023-04-29 10:58:49,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:49,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:50,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 10:58:50,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +62: [2023-04-29 10:58:50,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:50,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +62: [2023-04-29 10:58:50,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 10:58:50,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:50,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 10:58:50,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 10:58:50,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:50,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 10:58:50,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:50,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:50,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:50,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +45: [2023-04-29 10:58:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +40: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +40: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 10:58:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt. +23: [2023-04-29 10:58:50,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 10:58:50,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:50,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 10:58:50,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 10:58:50,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 10:58:50,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +19: [2023-04-29 10:58:50,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +19: [2023-04-29 10:58:50,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +19: [2023-04-29 10:58:50,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 10:58:50,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 10:58:50,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 10:58:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +36: [2023-04-29 10:58:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +36: [2023-04-29 10:58:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +61: [2023-04-29 10:58:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +31: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +36: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:50,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:50,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +36: [2023-04-29 10:58:50,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +36: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +20: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +20: [2023-04-29 10:58:50,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +61: [2023-04-29 10:58:50,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 10:58:50,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:50,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:50,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:50,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 10:58:50,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 10:58:50,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 10:58:50,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 10:58:50,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 10:58:50,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:50,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +40: [2023-04-29 10:58:50,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 10:58:50,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 10:58:50,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:50,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 10:58:50,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 10:58:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +40: [2023-04-29 10:58:50,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 10:58:50,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 10:58:50,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 10:58:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +61: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +43: [2023-04-29 10:58:50,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:50,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:50,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +19: [2023-04-29 10:58:50,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +43: [2023-04-29 10:58:50,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +43: [2023-04-29 10:58:50,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +43: [2023-04-29 10:58:50,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +19: [2023-04-29 10:58:50,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 10:58:50,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:50,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 10:58:50,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +49: [2023-04-29 10:58:50,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:50,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 10:58:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:50,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:50,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 10:58:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:50,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:50,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 10:58:50,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:50,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:50,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 10:58:50,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 10:58:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 10:58:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 10:58:50,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:50,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +41: [2023-04-29 10:58:50,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +41: [2023-04-29 10:58:50,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +41: [2023-04-29 10:58:50,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 10:58:50,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:50,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:50,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:50,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 10:58:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 10:58:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 10:58:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 10:58:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 10:58:50,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +28: [2023-04-29 10:58:50,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 10:58:50,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 10:58:50,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 10:58:50,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +50: [2023-04-29 10:58:50,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 10:58:50,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 10:58:50,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:50,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:50,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 10:58:50,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 10:58:50,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +40: [2023-04-29 10:58:50,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 10:58:50,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 10:58:50,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +62: [2023-04-29 10:58:50,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 10:58:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 10:58:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 10:58:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 10:58:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +19: [2023-04-29 10:58:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 10:58:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +40: [2023-04-29 10:58:50,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 10:58:50,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:50,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 10:58:50,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +40: [2023-04-29 10:58:50,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt... +14: [2023-04-29 10:58:50,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:50,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:50,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:50,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 10:58:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 10:58:50,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 10:58:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 10:58:50,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 10:58:50,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:50,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +18: [2023-04-29 10:58:50,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 10:58:50,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 10:58:50,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 10:58:50,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 10:58:50,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 10:58:50,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 10:58:50,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 10:58:50,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 10:58:50,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +18: [2023-04-29 10:58:50,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 10:58:50,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 10:58:50,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 10:58:50,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 10:58:50,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 10:58:50,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:50,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 10:58:50,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:50,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 10:58:50,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 10:58:50,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 10:58:50,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +50: [2023-04-29 10:58:50,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 10:58:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 10:58:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 10:58:50,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:50,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 10:58:50,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +36: [2023-04-29 10:58:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 10:58:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 10:58:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +32: [2023-04-29 10:58:50,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +18: [2023-04-29 10:58:50,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 10:58:50,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 10:58:50,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:50,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:50,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:50,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 10:58:50,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 10:58:50,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 10:58:50,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 10:58:50,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:50,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 10:58:50,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 10:58:50,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:50,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +43: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +47: [2023-04-29 10:58:50,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +32: [2023-04-29 10:58:50,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:50,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:50,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:50,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +54: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +45: [2023-04-29 10:58:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 10:58:50,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:50,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +45: [2023-04-29 10:58:50,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 10:58:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +55: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +14: [2023-04-29 10:58:50,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 10:58:50,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +39: [2023-04-29 10:58:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:50,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 10:58:50,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 10:58:50,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 10:58:50,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +14: [2023-04-29 10:58:50,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +41: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:50,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:50,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 10:58:50,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +57: [2023-04-29 10:58:50,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +22: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +38: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +41: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +22: [2023-04-29 10:58:50,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 10:58:50,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +38: [2023-04-29 10:58:50,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 10:58:50,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +22: [2023-04-29 10:58:50,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:50,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:50,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 10:58:50,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 10:58:50,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 10:58:50,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:50,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +28: [2023-04-29 10:58:50,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 10:58:50,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 10:58:50,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 10:58:50,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 10:58:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 10:58:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 10:58:50,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 10:58:50,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:50,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 10:58:50,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:50,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 10:58:50,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +49: [2023-04-29 10:58:50,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 10:58:50,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 10:58:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 10:58:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 10:58:50,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 10:58:50,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +28: [2023-04-29 10:58:50,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 10:58:50,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 10:58:50,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 10:58:50,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 10:58:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 10:58:50,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 10:58:50,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 10:58:50,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 10:58:50,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:50,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:50,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:50,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:50,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 10:58:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 10:58:50,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 10:58:50,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 10:58:50,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 10:58:50,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 10:58:50,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 10:58:50,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 10:58:50,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:50,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:50,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 10:58:50,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 10:58:50,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 10:58:50,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 10:58:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 10:58:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +31: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +31: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +49: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 10:58:50,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 10:58:50,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 10:58:50,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:50,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 10:58:50,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:50,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +32: [2023-04-29 10:58:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +32: [2023-04-29 10:58:50,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +32: [2023-04-29 10:58:50,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +46: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +46: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +37: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:50,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 10:58:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +46: [2023-04-29 10:58:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 10:58:50,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:50,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +59: [2023-04-29 10:58:50,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +46: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +46: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +51: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +51: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +10: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +31: [2023-04-29 10:58:50,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 10:58:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +29: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +29: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +29: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +38: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +29: [2023-04-29 10:58:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 10:58:50,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +27: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +27: [2023-04-29 10:58:50,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 10:58:50,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:50,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 10:58:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 10:58:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 10:58:50,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 10:58:50,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 10:58:50,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:50,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 10:58:50,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 10:58:50,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 10:58:50,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 10:58:50,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 10:58:50,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 10:58:50,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:50,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 10:58:50,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 10:58:50,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 10:58:50,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +17: [2023-04-29 10:58:50,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 10:58:50,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 10:58:50,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +11: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +32: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +11: [2023-04-29 10:58:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 10:58:50,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +58: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +59: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +50: [2023-04-29 10:58:50,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 10:58:50,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 10:58:50,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 10:58:50,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +22: [2023-04-29 10:58:50,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 10:58:50,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 10:58:50,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 10:58:50,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:50,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:50,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 10:58:50,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 10:58:50,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 10:58:50,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 10:58:50,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 10:58:50,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 10:58:50,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:50,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 10:58:50,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 10:58:50,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 10:58:50,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 10:58:50,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:50,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 10:58:50,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +62: [2023-04-29 10:58:50,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:50,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 10:58:50,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +27: [2023-04-29 10:58:50,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:50,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 10:58:50,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +63: [2023-04-29 10:58:50,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:50,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 10:58:50,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:50,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +36: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +29: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 10:58:50,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:50,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 10:58:50,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +36: [2023-04-29 10:58:50,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:50,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 10:58:50,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +13: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +49: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 10:58:50,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 10:58:50,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +57: [2023-04-29 10:58:50,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:50,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 10:58:50,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 10:58:50,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 10:58:50,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +49: [2023-04-29 10:58:50,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:50,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 10:58:50,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:50,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +52: [2023-04-29 10:58:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 10:58:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 10:58:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +58: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +50: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 10:58:50,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 10:58:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +21: [2023-04-29 10:58:50,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +58: [2023-04-29 10:58:50,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 10:58:50,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 10:58:50,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +47: [2023-04-29 10:58:50,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +47: [2023-04-29 10:58:50,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +47: [2023-04-29 10:58:50,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +36: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:50,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 10:58:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +10: [2023-04-29 10:58:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 10:58:50,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 10:58:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +36: [2023-04-29 10:58:50,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 10:58:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 10:58:50,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:50,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +36: [2023-04-29 10:58:50,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:50,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:50,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +46: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 10:58:50,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 10:58:50,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 10:58:50,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 10:58:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 10:58:50,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 10:58:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 10:58:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +10: [2023-04-29 10:58:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 10:58:50,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 10:58:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 10:58:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 10:58:50,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 10:58:50,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 10:58:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +47: [2023-04-29 10:58:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 10:58:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 10:58:50,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +43: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +43: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +43: [2023-04-29 10:58:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +43: [2023-04-29 10:58:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +32: [2023-04-29 10:58:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +32: [2023-04-29 10:58:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 10:58:50,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +25: [2023-04-29 10:58:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +38: [2023-04-29 10:58:50,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 10:58:50,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 10:58:50,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +25: [2023-04-29 10:58:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:50,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +63: [2023-04-29 10:58:50,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +46: [2023-04-29 10:58:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +30: [2023-04-29 10:58:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 10:58:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 10:58:50,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +29: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +27: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +30: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 10:58:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 10:58:50,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 10:58:50,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 10:58:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 10:58:50,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +38: [2023-04-29 10:58:50,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:50,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 10:58:50,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 10:58:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 10:58:50,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 10:58:50,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:50,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:50,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 10:58:50,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:50,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +29: [2023-04-29 10:58:50,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +13: [2023-04-29 10:58:50,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:50,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +19: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +52: [2023-04-29 10:58:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +13: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 10:58:50,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 10:58:50,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:50,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 10:58:50,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +59: [2023-04-29 10:58:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +14: [2023-04-29 10:58:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 10:58:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +13: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +48: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 10:58:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 10:58:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +11: [2023-04-29 10:58:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +43: [2023-04-29 10:58:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +59: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +59: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +59: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:50,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +16: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 10:58:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 10:58:50,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +59: [2023-04-29 10:58:50,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:50,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 10:58:50,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +13: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +25: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 10:58:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:50,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 10:58:50,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 10:58:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +52: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +15: [2023-04-29 10:58:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 10:58:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +52: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +15: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +57: [2023-04-29 10:58:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 10:58:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 10:58:50,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 10:58:50,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 10:58:50,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +52: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 10:58:50,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +15: [2023-04-29 10:58:50,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 10:58:50,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 10:58:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:50,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 10:58:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 10:58:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:50,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +41: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +41: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +41: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 10:58:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +56: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +12: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +12: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +56: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +12: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +56: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +12: [2023-04-29 10:58:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 10:58:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:50,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 10:58:50,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 10:58:50,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 10:58:50,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +16: [2023-04-29 10:58:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 10:58:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +47: [2023-04-29 10:58:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +60: [2023-04-29 10:58:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 10:58:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:50,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 10:58:50,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 10:58:50,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 10:58:50,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 10:58:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +52: [2023-04-29 10:58:50,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 10:58:50,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 10:58:50,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +39: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +25: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +39: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:50,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 10:58:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 10:58:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 10:58:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:50,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 10:58:50,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 10:58:50,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +12: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +28: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +28: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +23: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +41: [2023-04-29 10:58:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 10:58:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 10:58:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 10:58:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 10:58:50,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 10:58:50,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 10:58:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +12: [2023-04-29 10:58:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 10:58:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 10:58:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +57: [2023-04-29 10:58:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 10:58:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 10:58:50,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 10:58:50,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +59: [2023-04-29 10:58:50,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 10:58:50,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 10:58:50,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 10:58:50,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 10:58:50,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +34: [2023-04-29 10:58:50,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 10:58:50,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 10:58:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +20: [2023-04-29 10:58:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +59: [2023-04-29 10:58:50,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:50,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +57: [2023-04-29 10:58:50,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:50,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 10:58:50,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 10:58:50,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 10:58:50,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 10:58:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 10:58:50,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 10:58:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 10:58:50,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:50,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 10:58:50,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 10:58:50,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +28: [2023-04-29 10:58:50,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +25: [2023-04-29 10:58:50,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +48: [2023-04-29 10:58:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +15: [2023-04-29 10:58:50,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 10:58:50,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 10:58:50,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 10:58:50,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:50,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 10:58:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:50,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:50,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +15: [2023-04-29 10:58:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 10:58:50,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 10:58:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 10:58:50,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +53: [2023-04-29 10:58:50,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 10:58:50,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 10:58:50,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 10:58:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 10:58:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 10:58:50,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 10:58:50,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 10:58:50,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 10:58:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 10:58:50,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +59: [2023-04-29 10:58:50,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +61: [2023-04-29 10:58:50,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +61: [2023-04-29 10:58:50,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +61: [2023-04-29 10:58:50,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 10:58:50,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 10:58:50,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +46: [2023-04-29 10:58:50,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +46: [2023-04-29 10:58:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +46: [2023-04-29 10:58:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 10:58:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 10:58:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 10:58:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 10:58:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +15: [2023-04-29 10:58:50,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +60: [2023-04-29 10:58:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 10:58:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +53: [2023-04-29 10:58:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 10:58:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 10:58:50,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 10:58:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 10:58:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +53: [2023-04-29 10:58:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:50,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 10:58:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 10:58:50,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 10:58:50,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:50,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 10:58:50,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 10:58:50,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +25: [2023-04-29 10:58:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 10:58:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +15: [2023-04-29 10:58:50,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +53: [2023-04-29 10:58:50,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 10:58:50,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 10:58:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +33: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +33: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +33: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +56: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +25: [2023-04-29 10:58:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 10:58:50,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 10:58:50,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +56: [2023-04-29 10:58:50,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +56: [2023-04-29 10:58:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 10:58:50,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:50,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 10:58:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 10:58:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 10:58:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 10:58:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 10:58:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 10:58:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +56: [2023-04-29 10:58:50,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 10:58:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:50,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... +12: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +35: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 10:58:50,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 10:58:50,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +49: [2023-04-29 10:58:50,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 10:58:50,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +49: [2023-04-29 10:58:50,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:50,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 10:58:50,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 10:58:50,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 10:58:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 10:58:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 10:58:50,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 10:58:50,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:50,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 10:58:50,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:50,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:50,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:50,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 10:58:50,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 10:58:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 10:58:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +17: [2023-04-29 10:58:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 10:58:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +17: [2023-04-29 10:58:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 10:58:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:50,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +40: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 10:58:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 10:58:50,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 10:58:50,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +60: [2023-04-29 10:58:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 10:58:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +57: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 10:58:50,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 10:58:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 10:58:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +20: [2023-04-29 10:58:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:50,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 10:58:50,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +60: [2023-04-29 10:58:50,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 10:58:50,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 10:58:50,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 10:58:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 10:58:50,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:50,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 10:58:50,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 10:58:50,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 10:58:50,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 10:58:50,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 10:58:50,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +24: [2023-04-29 10:58:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 10:58:50,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +61: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +52: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +52: [2023-04-29 10:58:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +52: [2023-04-29 10:58:50,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 10:58:50,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +34: [2023-04-29 10:58:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 10:58:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 10:58:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +57: [2023-04-29 10:58:50,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:50,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 10:58:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 10:58:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 10:58:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 10:58:50,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 10:58:50,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 10:58:50,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 10:58:50,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 10:58:50,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 10:58:50,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +30: [2023-04-29 10:58:50,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +40: [2023-04-29 10:58:50,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 10:58:50,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 10:58:50,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:50,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 10:58:50,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 10:58:50,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +52: [2023-04-29 10:58:50,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 10:58:50,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 10:58:50,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +33: [2023-04-29 10:58:50,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +52: [2023-04-29 10:58:50,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 10:58:50,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +31: [2023-04-29 10:58:50,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 10:58:50,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 10:58:50,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 10:58:50,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 10:58:50,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +31: [2023-04-29 10:58:50,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +54: [2023-04-29 10:58:50,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:50,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +32: [2023-04-29 10:58:50,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +32: [2023-04-29 10:58:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +31: [2023-04-29 10:58:50,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +32: [2023-04-29 10:58:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +17: [2023-04-29 10:58:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +63: [2023-04-29 10:58:50,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +31: [2023-04-29 10:58:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 10:58:50,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 10:58:50,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +31: [2023-04-29 10:58:50,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +31: [2023-04-29 10:58:50,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +17: [2023-04-29 10:58:50,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +17: [2023-04-29 10:58:50,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:50,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 2: [2023-04-29 10:58:50,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 10:58:50,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 10:58:50,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +23: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +23: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 10:58:50,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +11: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 10:58:50,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:50,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 10:58:50,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:50,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:50,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 10:58:50,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:50,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 10:58:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 10:58:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 10:58:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 10:58:50,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 10:58:50,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +63: [2023-04-29 10:58:50,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +63: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +63: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +63: [2023-04-29 10:58:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +40: [2023-04-29 10:58:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 10:58:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 10:58:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 10:58:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 10:58:50,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 10:58:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +40: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +24: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:50,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 10:58:50,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 10:58:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 10:58:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +28: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +28: [2023-04-29 10:58:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 10:58:50,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +27: [2023-04-29 10:58:50,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:50,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:50,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:50,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:50,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 10:58:50,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:50,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:50,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:50,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +13: [2023-04-29 10:58:50,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 10:58:50,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +21: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +21: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +13: [2023-04-29 10:58:50,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:50,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +22: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +22: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 10:58:50,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 10:58:50,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 10:58:50,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 10:58:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 10:58:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 10:58:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:50,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 10:58:50,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 2: [2023-04-29 10:58:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +61: [2023-04-29 10:58:50,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:50,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:50,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:50,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:50,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 10:58:50,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 10:58:50,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 10:58:50,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 10:58:50,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +22: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 10:58:50,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 10:58:50,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 10:58:50,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +14: [2023-04-29 10:58:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +14: [2023-04-29 10:58:50,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +14: [2023-04-29 10:58:50,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 10:58:50,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +31: [2023-04-29 10:58:50,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:50,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 10:58:50,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 10:58:50,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 10:58:50,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 10:58:50,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +25: [2023-04-29 10:58:50,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 9: [2023-04-29 10:58:50,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +11: [2023-04-29 10:58:50,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:50,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 10:58:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 10:58:50,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 10:58:50,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 4: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 10:58:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 10:58:50,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +28: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 10:58:50,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +27: [2023-04-29 10:58:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +63: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +14: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +13: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 10:58:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +14: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 10:58:50,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +11: [2023-04-29 10:58:50,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +16: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +13: [2023-04-29 10:58:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +55: [2023-04-29 10:58:50,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 10:58:50,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 10:58:50,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:50,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +28: [2023-04-29 10:58:50,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:50,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +35: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +16: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 10:58:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 10:58:50,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 10:58:50,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +35: [2023-04-29 10:58:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:50,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 10:58:50,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:50,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 10:58:50,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:50,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 10:58:50,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 10:58:50,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 10:58:50,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 10:58:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:50,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 10:58:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 10:58:50,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 10:58:50,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 10:58:50,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 10:58:50,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 10:58:50,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 10:58:50,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +38: [2023-04-29 10:58:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 10:58:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 10:58:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 10:58:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +21: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:50,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 10:58:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 1: [2023-04-29 10:58:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:50,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 10:58:50,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +21: [2023-04-29 10:58:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 10:58:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 10:58:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +10: [2023-04-29 10:58:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +35: [2023-04-29 10:58:50,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:50,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 10:58:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 10:58:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +10: [2023-04-29 10:58:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 10:58:50,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 10:58:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 10:58:50,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 10:58:50,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 10:58:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +58: [2023-04-29 10:58:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +58: [2023-04-29 10:58:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +58: [2023-04-29 10:58:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 10:58:50,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +29: [2023-04-29 10:58:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +27: [2023-04-29 10:58:50,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 10:58:50,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:50,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 10:58:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 10:58:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +20: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +20: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +20: [2023-04-29 10:58:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 10:58:50,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 10:58:50,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +38: [2023-04-29 10:58:50,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:50,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +27: [2023-04-29 10:58:50,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 10:58:50,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 10:58:50,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 10:58:50,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 10:58:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 10:58:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 4: [2023-04-29 10:58:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 10:58:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 10:58:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 10:58:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 10:58:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +12: [2023-04-29 10:58:50,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 4: [2023-04-29 10:58:50,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 10:58:50,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:50,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 10:58:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +51: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +18: [2023-04-29 10:58:50,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +16: [2023-04-29 10:58:50,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 10:58:50,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:50,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt... +25: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +58: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +58: [2023-04-29 10:58:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 10:58:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:50,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 10:58:50,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +18: [2023-04-29 10:58:50,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 10:58:50,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 4: [2023-04-29 10:58:50,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 10:58:50,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +59: [2023-04-29 10:58:50,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +12: [2023-04-29 10:58:50,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 10:58:50,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:50,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +59: [2023-04-29 10:58:50,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:50,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:50,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 10:58:50,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 10:58:50,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 10:58:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +25: [2023-04-29 10:58:50,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:50,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 10:58:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 10:58:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 10:58:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 10:58:50,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 10:58:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 10:58:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 10:58:50,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 10:58:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +30: [2023-04-29 10:58:50,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:50,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 10:58:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 10:58:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:50,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:50,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 10:58:50,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 10:58:50,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 10:58:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 10:58:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 10:58:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 10:58:50,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:50,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 10:58:50,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 10:58:50,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:50,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +26: [2023-04-29 10:58:50,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 10:58:50,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 10:58:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +12: [2023-04-29 10:58:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:50,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 10:58:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 10:58:50,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 10:58:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 10:58:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:50,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 10:58:50,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 10:58:50,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:50,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 10:58:50,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 10:58:50,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 10:58:50,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 10:58:50,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:50,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 10:58:50,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:50,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:50,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:50,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:50,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 10:58:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 10:58:50,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:50,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 10:58:50,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:50,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 10:58:50,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:50,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 10:58:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 10:58:50,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +10: [2023-04-29 10:58:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 10:58:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +12: [2023-04-29 10:58:50,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 10:58:50,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:50,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +12: [2023-04-29 10:58:50,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +56: [2023-04-29 10:58:50,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 10:58:50,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:50,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 10:58:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 10:58:50,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 10:58:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt... +22: [2023-04-29 10:58:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 10:58:50,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 10:58:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 10:58:50,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 10:58:50,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 3: [2023-04-29 10:58:50,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:50,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:50,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:50,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 10:58:50,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 10:58:50,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:50,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 10:58:50,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +51: [2023-04-29 10:58:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 10:58:50,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:50,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 10:58:50,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 10:58:50,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +19: [2023-04-29 10:58:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 10:58:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 10:58:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 10:58:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 7: [2023-04-29 10:58:50,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 10:58:50,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:50,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:50,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:50,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:50,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 10:58:50,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:50,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:50,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 10:58:50,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 10:58:50,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:50,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:50,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:50,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:50,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:50,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:50,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 10:58:50,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:50,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 10:58:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 10:58:50,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:50,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +26: [2023-04-29 10:58:50,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:50,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:50,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 10:58:50,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +48: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +48: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +48: [2023-04-29 10:58:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +22: [2023-04-29 10:58:50,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 10:58:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:50,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 10:58:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 0: [2023-04-29 10:58:50,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 10:58:50,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:50,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 10:58:50,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 10:58:50,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 10:58:50,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +22: [2023-04-29 10:58:50,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 10:58:50,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:50,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 10:58:50,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 10:58:50,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 10:58:50,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 10:58:50,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +48: [2023-04-29 10:58:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:50,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:50,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:50,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:50,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 10:58:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 10:58:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 10:58:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 10:58:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:50,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:50,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 10:58:50,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 10:58:50,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:50,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 10:58:50,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 10:58:51,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:51,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:51,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:51,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 10:58:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +22: [2023-04-29 10:58:51,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 10:58:51,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 10:58:51,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 10:58:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +47: [2023-04-29 10:58:51,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:51,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +56: [2023-04-29 10:58:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +56: [2023-04-29 10:58:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 10:58:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +19: [2023-04-29 10:58:51,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +17: [2023-04-29 10:58:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +17: [2023-04-29 10:58:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +17: [2023-04-29 10:58:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +17: [2023-04-29 10:58:51,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +58: [2023-04-29 10:58:51,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:51,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:51,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:51,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 10:58:51,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:51,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 10:58:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:51,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 10:58:51,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +34: [2023-04-29 10:58:51,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 10:58:51,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 10:58:51,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 10:58:51,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 10:58:51,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:51,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +34: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +53: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 10:58:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 10:58:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +33: [2023-04-29 10:58:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +33: [2023-04-29 10:58:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +33: [2023-04-29 10:58:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 10:58:51,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 10:58:51,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 10:58:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:51,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +17: [2023-04-29 10:58:51,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 10:58:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +58: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +60: [2023-04-29 10:58:51,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 10:58:51,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +61: [2023-04-29 10:58:51,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 10:58:51,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:51,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:51,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:51,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +53: [2023-04-29 10:58:51,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:51,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:51,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:51,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 10:58:51,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:51,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:51,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 1: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +61: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 10:58:51,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 1: [2023-04-29 10:58:51,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +49: [2023-04-29 10:58:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 10:58:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:51,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:51,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:51,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 10:58:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:51,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 10:58:51,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +60: [2023-04-29 10:58:51,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 10:58:51,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:51,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:51,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +60: [2023-04-29 10:58:51,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +50: [2023-04-29 10:58:51,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +35: [2023-04-29 10:58:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 2: [2023-04-29 10:58:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 10:58:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 10:58:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 10:58:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +50: [2023-04-29 10:58:51,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 10:58:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 10:58:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 10:58:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 10:58:51,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +27: [2023-04-29 10:58:51,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 10:58:51,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 10:58:51,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 10:58:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 10:58:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 10:58:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 10:58:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 10:58:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 10:58:51,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 10:58:51,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 10:58:51,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 10:58:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:51,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 10:58:51,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 10:58:51,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 10:58:51,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 10:58:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:51,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 10:58:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 10:58:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 10:58:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 10:58:51,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 10:58:51,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 10:58:51,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:51,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +17: [2023-04-29 10:58:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +17: [2023-04-29 10:58:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +61: [2023-04-29 10:58:51,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +27: [2023-04-29 10:58:51,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +17: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +61: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:51,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 3: [2023-04-29 10:58:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 3: [2023-04-29 10:58:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 3: [2023-04-29 10:58:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:51,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:51,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 10:58:51,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +21: [2023-04-29 10:58:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 10:58:51,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 10:58:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 10:58:51,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:51,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:51,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +63: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 10:58:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 10:58:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 10:58:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 10:58:51,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:51,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 10:58:51,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +41: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:51,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 10:58:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 10:58:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 10:58:51,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 10:58:51,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +23: [2023-04-29 10:58:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +23: [2023-04-29 10:58:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +23: [2023-04-29 10:58:51,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +24: [2023-04-29 10:58:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 10:58:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 10:58:51,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 10:58:51,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 10:58:51,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 10:58:51,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 10:58:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 10:58:51,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 10:58:51,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 10:58:51,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 10:58:51,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 10:58:51,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 10:58:51,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 10:58:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 10:58:51,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 10:58:51,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 10:58:51,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +51: [2023-04-29 10:58:51,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:51,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:51,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 10:58:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +15: [2023-04-29 10:58:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 10:58:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +20: [2023-04-29 10:58:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +20: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 10:58:51,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +10: [2023-04-29 10:58:51,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 10:58:51,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 10:58:51,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 10:58:51,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 10:58:51,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 10:58:51,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 10:58:51,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +28: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:51,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +17: [2023-04-29 10:58:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +19: [2023-04-29 10:58:51,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 10:58:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 10:58:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 10:58:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 10:58:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 10:58:51,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 10:58:51,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 5: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 5: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +63: [2023-04-29 10:58:51,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 10:58:51,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 0: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 0: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 0: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +63: [2023-04-29 10:58:51,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 10:58:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 10:58:51,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 10:58:51,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 10:58:51,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +62: [2023-04-29 10:58:51,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:51,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:51,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 10:58:51,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:51,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +41: [2023-04-29 10:58:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 10:58:51,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +18: [2023-04-29 10:58:51,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +18: [2023-04-29 10:58:51,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +18: [2023-04-29 10:58:51,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +62: [2023-04-29 10:58:51,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:51,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +62: [2023-04-29 10:58:51,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 10:58:51,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:51,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +62: [2023-04-29 10:58:51,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 10:58:51,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +17: [2023-04-29 10:58:51,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:51,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 10:58:51,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 10:58:51,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 10:58:51,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 10:58:51,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 10:58:51,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 10:58:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 10:58:51,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 10:58:51,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +22: [2023-04-29 10:58:51,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 10:58:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:51,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 10:58:51,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +14: [2023-04-29 10:58:51,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +14: [2023-04-29 10:58:51,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +14: [2023-04-29 10:58:51,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 10:58:51,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 10:58:51,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +54: [2023-04-29 10:58:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 10:58:51,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +47: [2023-04-29 10:58:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +47: [2023-04-29 10:58:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +25: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +47: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 10:58:51,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:51,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:51,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 10:58:51,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 10:58:51,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 10:58:51,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +20: [2023-04-29 10:58:51,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 10:58:51,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 10:58:51,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +33: [2023-04-29 10:58:51,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +33: [2023-04-29 10:58:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 10:58:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +33: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 2: [2023-04-29 10:58:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 10:58:51,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 10:58:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 10:58:51,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 10:58:51,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 10:58:51,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 10:58:51,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 10:58:51,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 2: [2023-04-29 10:58:51,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 2: [2023-04-29 10:58:51,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:51,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:51,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 10:58:51,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 10:58:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 10:58:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 10:58:51,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +25: [2023-04-29 10:58:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 10:58:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 10:58:51,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 10:58:51,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 10:58:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 10:58:51,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 10:58:51,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 10:58:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 10:58:51,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +62: [2023-04-29 10:58:51,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 10:58:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +61: [2023-04-29 10:58:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 10:58:51,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +39: [2023-04-29 10:58:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 10:58:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 10:58:51,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 10:58:51,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +62: [2023-04-29 10:58:51,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 10:58:51,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:51,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 10:58:51,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 10:58:51,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 10:58:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 10:58:51,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +30: [2023-04-29 10:58:51,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +47: [2023-04-29 10:58:51,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 10:58:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +30: [2023-04-29 10:58:51,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +30: [2023-04-29 10:58:51,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:51,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +31: [2023-04-29 10:58:51,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 2: [2023-04-29 10:58:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +31: [2023-04-29 10:58:51,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:51,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:51,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:51,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 10:58:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 10:58:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 10:58:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +47: [2023-04-29 10:58:51,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 10:58:51,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 10:58:51,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +47: [2023-04-29 10:58:51,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 10:58:51,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +25: [2023-04-29 10:58:51,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 10:58:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 10:58:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 10:58:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 10:58:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +47: [2023-04-29 10:58:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 10:58:51,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 10:58:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 10:58:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 10:58:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 10:58:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +42: [2023-04-29 10:58:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +25: [2023-04-29 10:58:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +42: [2023-04-29 10:58:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 10:58:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 10:58:51,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 10:58:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 10:58:51,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 10:58:51,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:51,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 10:58:51,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 10:58:51,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 6: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 10:58:51,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 10:58:51,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 10:58:51,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 10:58:51,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +17: [2023-04-29 10:58:51,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 6: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 7: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +56: [2023-04-29 10:58:51,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 6: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +37: [2023-04-29 10:58:51,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 10:58:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +37: [2023-04-29 10:58:51,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 10:58:51,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 10:58:51,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 10:58:51,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +37: [2023-04-29 10:58:51,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +37: [2023-04-29 10:58:51,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 10:58:51,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 10:58:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +27: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +44: [2023-04-29 10:58:51,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +27: [2023-04-29 10:58:51,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 10:58:51,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 10:58:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +29: [2023-04-29 10:58:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 10:58:51,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 10:58:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +39: [2023-04-29 10:58:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 10:58:51,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +29: [2023-04-29 10:58:51,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +39: [2023-04-29 10:58:51,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +29: [2023-04-29 10:58:51,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +39: [2023-04-29 10:58:51,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 10:58:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 10:58:51,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 10:58:51,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 10:58:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:51,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 10:58:51,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 10:58:51,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 10:58:51,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 10:58:51,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 10:58:51,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 10:58:51,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +31: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:51,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 10:58:51,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +11: [2023-04-29 10:58:51,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:51,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 10:58:51,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 10:58:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 10:58:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 10:58:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +31: [2023-04-29 10:58:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 10:58:51,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 10:58:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 10:58:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 10:58:51,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +61: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 10:58:51,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 10:58:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 10:58:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 10:58:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 10:58:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 10:58:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +55: [2023-04-29 10:58:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +27: [2023-04-29 10:58:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 10:58:51,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:51,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 10:58:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 10:58:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +56: [2023-04-29 10:58:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +56: [2023-04-29 10:58:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 10:58:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +55: [2023-04-29 10:58:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 6: [2023-04-29 10:58:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +37: [2023-04-29 10:58:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +46: [2023-04-29 10:58:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +46: [2023-04-29 10:58:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +46: [2023-04-29 10:58:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 10:58:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 10:58:51,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:51,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +28: [2023-04-29 10:58:51,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 10:58:51,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 10:58:51,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 10:58:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 10:58:51,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +27: [2023-04-29 10:58:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 10:58:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:51,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 10:58:51,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 10:58:51,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 10:58:51,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 10:58:51,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 10:58:51,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 10:58:51,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +11: [2023-04-29 10:58:51,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 10:58:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 10:58:51,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 10:58:51,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 10:58:51,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 10:58:51,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +11: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 10:58:51,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 10:58:51,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 10:58:51,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 10:58:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +55: [2023-04-29 10:58:51,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 10:58:51,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 10:58:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 10:58:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +57: [2023-04-29 10:58:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +55: [2023-04-29 10:58:51,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 10:58:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +11: [2023-04-29 10:58:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 10:58:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +35: [2023-04-29 10:58:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 10:58:51,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 10:58:51,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 10:58:51,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 10:58:51,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:51,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +61: [2023-04-29 10:58:51,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 10:58:51,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 10:58:51,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 10:58:51,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 10:58:51,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +46: [2023-04-29 10:58:51,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 10:58:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +11: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 10:58:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 10:58:51,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +12: [2023-04-29 10:58:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 10:58:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:51,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 10:58:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 10:58:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 10:58:51,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +35: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:51,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:51,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:51,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 10:58:51,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:51,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 10:58:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:51,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 10:58:51,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:51,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +25: [2023-04-29 10:58:51,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +25: [2023-04-29 10:58:51,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 10:58:51,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 10:58:51,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +25: [2023-04-29 10:58:51,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 10:58:51,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:51,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:51,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:51,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:51,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:51,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:51,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:51,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:51,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:51,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:51,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +22: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +24: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:51,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +24: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +22: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +57: [2023-04-29 10:58:51,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:51,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +63: [2023-04-29 10:58:51,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:51,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 10:58:51,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:51,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 10:58:51,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +31: [2023-04-29 10:58:51,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 10:58:51,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +54: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 10:58:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 10:58:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 10:58:51,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +45: [2023-04-29 10:58:51,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +45: [2023-04-29 10:58:51,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +45: [2023-04-29 10:58:51,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:51,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +57: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 7: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 7: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +42: [2023-04-29 10:58:51,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 10:58:51,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 10:58:51,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:51,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:51,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +63: [2023-04-29 10:58:51,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 10:58:51,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 7: [2023-04-29 10:58:51,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 10:58:51,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:51,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 10:58:51,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 10:58:51,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:51,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 10:58:51,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +49: [2023-04-29 10:58:51,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 10:58:51,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +27: [2023-04-29 10:58:51,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +27: [2023-04-29 10:58:51,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +27: [2023-04-29 10:58:51,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 10:58:51,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +24: [2023-04-29 10:58:51,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:51,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:51,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 10:58:51,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:51,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:51,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +26: [2023-04-29 10:58:51,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 10:58:51,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:51,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:51,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:51,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 10:58:51,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +26: [2023-04-29 10:58:51,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 10:58:51,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +26: [2023-04-29 10:58:51,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +57: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +31: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 10:58:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 10:58:51,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +13: [2023-04-29 10:58:51,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +13: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +62: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +45: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 10:58:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +57: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +14: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +42: [2023-04-29 10:58:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 10:58:51,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +29: [2023-04-29 10:58:51,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 10:58:51,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 10:58:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 10:58:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 10:58:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 10:58:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:51,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +14: [2023-04-29 10:58:51,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:51,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 10:58:51,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 10:58:51,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +14: [2023-04-29 10:58:51,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:51,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 10:58:51,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 10:58:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 10:58:51,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 7: [2023-04-29 10:58:51,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +41: [2023-04-29 10:58:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +18: [2023-04-29 10:58:51,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +41: [2023-04-29 10:58:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +41: [2023-04-29 10:58:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +27: [2023-04-29 10:58:51,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:51,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:51,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +49: [2023-04-29 10:58:51,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:51,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:51,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 6: [2023-04-29 10:58:51,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +62: [2023-04-29 10:58:51,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:51,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 10:58:51,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:51,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 10:58:51,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:51,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 10:58:51,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +11: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +58: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +58: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +28: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +28: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +28: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 9: [2023-04-29 10:58:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +50: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +29: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 10:58:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 10:58:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +11: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 10:58:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:51,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 10:58:51,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:51,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 10:58:51,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:51,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:51,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:51,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 10:58:51,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 10:58:51,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:51,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 10:58:51,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 10:58:51,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 10:58:51,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 10:58:51,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 10:58:51,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:51,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:51,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:51,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 10:58:51,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +32: [2023-04-29 10:58:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +52: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +52: [2023-04-29 10:58:51,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +18: [2023-04-29 10:58:51,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 10:58:51,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:51,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 10:58:51,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +28: [2023-04-29 10:58:51,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 10:58:51,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 10:58:51,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +28: [2023-04-29 10:58:51,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +43: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +47: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +47: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +10: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 10:58:51,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 10:58:51,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +32: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +32: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:51,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 10:58:51,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +35: [2023-04-29 10:58:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +16: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +44: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +10: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 10:58:51,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 10:58:51,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:51,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:51,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:51,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +19: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 10:58:51,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +44: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +44: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +44: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +16: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +41: [2023-04-29 10:58:51,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:51,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 10:58:51,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 10:58:51,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:51,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 10:58:51,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:51,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:51,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +35: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +18: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:51,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 10:58:51,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:51,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:51,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:51,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:51,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +45: [2023-04-29 10:58:51,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +19: [2023-04-29 10:58:51,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +26: [2023-04-29 10:58:51,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +44: [2023-04-29 10:58:51,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +44: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +12: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +12: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 10:58:51,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 0: [2023-04-29 10:58:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +38: [2023-04-29 10:58:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 10:58:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:51,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:51,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:51,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:51,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 10:58:51,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:51,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +34: [2023-04-29 10:58:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:51,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:51,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 10:58:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 10:58:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +47: [2023-04-29 10:58:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +47: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:51,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +47: [2023-04-29 10:58:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 10:58:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 10:58:51,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 10:58:51,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 10:58:51,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +13: [2023-04-29 10:58:51,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +13: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 10:58:51,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 10:58:51,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:51,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:51,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 10:58:51,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +59: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 10:58:51,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 10:58:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +18: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +59: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +59: [2023-04-29 10:58:51,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 10:58:51,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 10:58:51,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 10:58:51,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:51,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +62: [2023-04-29 10:58:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:51,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 10:58:51,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:51,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 10:58:51,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:51,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 10:58:51,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:51,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +12: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +62: [2023-04-29 10:58:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +41: [2023-04-29 10:58:51,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:51,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 10:58:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 10:58:51,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 10:58:51,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:51,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:51,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:51,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:51,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:51,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:51,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:51,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:51,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 10:58:51,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:51,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 10:58:51,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 10:58:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 10:58:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 10:58:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:51,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:51,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 10:58:51,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:51,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:51,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:51,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 10:58:51,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:51,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 10:58:51,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +58: [2023-04-29 10:58:51,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 10:58:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 10:58:51,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 10:58:51,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:51,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:51,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 10:58:51,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 10:58:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:51,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 10:58:51,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:51,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 10:58:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 10:58:51,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:51,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:51,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 10:58:51,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 3: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 3: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +34: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 10:58:51,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 10:58:51,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 10:58:51,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 10:58:51,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:51,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 10:58:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 10:58:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:51,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:51,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:51,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 10:58:51,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:51,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:51,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:51,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +44: [2023-04-29 10:58:51,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:51,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 10:58:51,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +60: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:51,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 10:58:51,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:51,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +60: [2023-04-29 10:58:51,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +60: [2023-04-29 10:58:51,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 10:58:51,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 10:58:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:51,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +62: [2023-04-29 10:58:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:51,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +41: [2023-04-29 10:58:51,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:51,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:51,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +36: [2023-04-29 10:58:51,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:51,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 10:58:51,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +36: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +36: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 4: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +39: [2023-04-29 10:58:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 10:58:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 10:58:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 10:58:51,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:51,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 10:58:51,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:51,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:51,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 4: [2023-04-29 10:58:51,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +36: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +53: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +36: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +36: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 10:58:51,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +34: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 4: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +37: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:51,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... +39: [2023-04-29 10:58:51,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:51,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:51,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt... + 4: [2023-04-29 10:58:51,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +61: [2023-04-29 10:58:51,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 10:58:51,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 10:58:51,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:51,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 10:58:51,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... + 0: [2023-04-29 10:58:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 10:58:51,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:51,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:51,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:51,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 10:58:51,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:51,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 10:58:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 10:58:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 10:58:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 10:58:51,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:51,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:51,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:51,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:51,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:51,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:51,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:51,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:51,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 10:58:51,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:51,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:51,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:51,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:51,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:51,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:51,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:51,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 10:58:51,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:51,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:51,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:51,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:51,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 10:58:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 10:58:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 10:58:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +26: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +26: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +26: [2023-04-29 10:58:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 10:58:51,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 10:58:51,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 10:58:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 10:58:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:51,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:51,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 10:58:51,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +13: [2023-04-29 10:58:51,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +13: [2023-04-29 10:58:51,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +13: [2023-04-29 10:58:51,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +44: [2023-04-29 10:58:51,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 10:58:51,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 10:58:51,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 10:58:51,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +56: [2023-04-29 10:58:51,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +16: [2023-04-29 10:58:51,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +56: [2023-04-29 10:58:51,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +56: [2023-04-29 10:58:51,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:51,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:51,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:51,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:51,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 10:58:51,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +33: [2023-04-29 10:58:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +33: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 10:58:51,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +25: [2023-04-29 10:58:51,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +33: [2023-04-29 10:58:51,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 10:58:51,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +25: [2023-04-29 10:58:51,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +53: [2023-04-29 10:58:51,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:51,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 10:58:51,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:51,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 10:58:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:51,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 10:58:51,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:51,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 10:58:51,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 10:58:51,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 10:58:51,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 10:58:51,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:51,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 10:58:51,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:51,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:51,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:51,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:51,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 10:58:51,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 10:58:51,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:51,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 10:58:51,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 10:58:51,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 10:58:51,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 10:58:51,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 10:58:51,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 10:58:51,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:51,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +14: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:51,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 10:58:51,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:51,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 10:58:51,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 10:58:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +53: [2023-04-29 10:58:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +23: [2023-04-29 10:58:51,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 10:58:51,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 10:58:51,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 10:58:51,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 10:58:51,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 10:58:51,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:51,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:51,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +18: [2023-04-29 10:58:51,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 10:58:51,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 10:58:51,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +37: [2023-04-29 10:58:51,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +18: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 10:58:51,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +35: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 10:58:51,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 4: [2023-04-29 10:58:51,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 10:58:51,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 10:58:51,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 10:58:51,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 5: [2023-04-29 10:58:51,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +36: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 5: [2023-04-29 10:58:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 10:58:51,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 10:58:51,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:51,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:51,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:51,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:51,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:51,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:51,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:51,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:51,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:51,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:51,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:51,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 10:58:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:51,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:51,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:51,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 10:58:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 10:58:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 10:58:51,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:51,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 10:58:51,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 10:58:51,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 10:58:51,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 10:58:51,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +30: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +49: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 10:58:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +37: [2023-04-29 10:58:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:51,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:51,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:51,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:51,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:51,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:51,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +30: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 10:58:51,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 10:58:51,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 10:58:51,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 10:58:51,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:51,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:51,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:51,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:51,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:51,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:51,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 10:58:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 10:58:51,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +40: [2023-04-29 10:58:51,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +38: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:51,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 10:58:51,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 10:58:51,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:51,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:51,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:51,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +46: [2023-04-29 10:58:51,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:51,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:51,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 10:58:51,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +25: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 10:58:51,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +33: [2023-04-29 10:58:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 10:58:51,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:51,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +33: [2023-04-29 10:58:51,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 10:58:51,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:51,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:51,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 10:58:51,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 10:58:51,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +56: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +48: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +23: [2023-04-29 10:58:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +48: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:51,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:51,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +61: [2023-04-29 10:58:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +35: [2023-04-29 10:58:51,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:51,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:51,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:51,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 10:58:51,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +48: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 10:58:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 10:58:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 10:58:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 10:58:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 10:58:52,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 10:58:52,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 10:58:52,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 10:58:52,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 10:58:52,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +20: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 10:58:52,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 10:58:52,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 10:58:52,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 10:58:52,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:52,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +46: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +46: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +46: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +20: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:52,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +17: [2023-04-29 10:58:52,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +23: [2023-04-29 10:58:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:52,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +23: [2023-04-29 10:58:52,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 10:58:52,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 10:58:52,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 10:58:52,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 10:58:52,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 10:58:52,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 10:58:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 10:58:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:52,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 10:58:52,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 10:58:52,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 10:58:52,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 10:58:52,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 10:58:52,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:52,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 10:58:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 10:58:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 10:58:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 10:58:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +37: [2023-04-29 10:58:52,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:52,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +37: [2023-04-29 10:58:52,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +50: [2023-04-29 10:58:52,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 10:58:52,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:52,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 10:58:52,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:52,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:52,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:52,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:52,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +49: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 10:58:52,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 10:58:52,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 10:58:52,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +57: [2023-04-29 10:58:52,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 10:58:52,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 10:58:52,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 10:58:52,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +38: [2023-04-29 10:58:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:52,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:52,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +31: [2023-04-29 10:58:52,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 10:58:52,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 10:58:52,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:52,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +61: [2023-04-29 10:58:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 10:58:52,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:52,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 10:58:52,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:52,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 10:58:52,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:52,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +20: [2023-04-29 10:58:52,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:52,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +63: [2023-04-29 10:58:52,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 10:58:52,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 10:58:52,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +48: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +20: [2023-04-29 10:58:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 10:58:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +12: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 10:58:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +20: [2023-04-29 10:58:52,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +30: [2023-04-29 10:58:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +20: [2023-04-29 10:58:52,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 10:58:52,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 10:58:52,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:52,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +38: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +22: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +35: [2023-04-29 10:58:52,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 10:58:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +45: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +40: [2023-04-29 10:58:52,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 10:58:52,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +12: [2023-04-29 10:58:52,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +21: [2023-04-29 10:58:52,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 10:58:52,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:52,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +27: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 10:58:52,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 10:58:52,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +32: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +27: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +27: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +48: [2023-04-29 10:58:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 10:58:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +48: [2023-04-29 10:58:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 10:58:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 10:58:52,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 10:58:52,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +24: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +32: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 10:58:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 10:58:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 10:58:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +24: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 10:58:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 10:58:52,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:52,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +46: [2023-04-29 10:58:52,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:52,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +39: [2023-04-29 10:58:52,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:52,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 10:58:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +48: [2023-04-29 10:58:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 10:58:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 10:58:52,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +46: [2023-04-29 10:58:52,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +29: [2023-04-29 10:58:52,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:52,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 10:58:52,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +39: [2023-04-29 10:58:52,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +39: [2023-04-29 10:58:52,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 10:58:52,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 10:58:52,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 10:58:52,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:52,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:52,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 10:58:52,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 10:58:52,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +35: [2023-04-29 10:58:52,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:52,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 10:58:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 10:58:52,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +57: [2023-04-29 10:58:52,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:52,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 10:58:52,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 10:58:52,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 10:58:52,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 10:58:52,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +58: [2023-04-29 10:58:52,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +58: [2023-04-29 10:58:52,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 10:58:52,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 10:58:52,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +58: [2023-04-29 10:58:52,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 10:58:52,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 10:58:52,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +35: [2023-04-29 10:58:52,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:52,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 10:58:52,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 10:58:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 10:58:52,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 10:58:52,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 10:58:52,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 10:58:52,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 10:58:52,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:52,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 10:58:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 10:58:52,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 10:58:52,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 10:58:52,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 10:58:52,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 10:58:52,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +50: [2023-04-29 10:58:52,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 10:58:52,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 10:58:52,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 10:58:52,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +45: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 10:58:52,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 10:58:52,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt... +12: [2023-04-29 10:58:52,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 10:58:52,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:52,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +15: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:52,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 10:58:52,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 10:58:52,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:52,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:52,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +29: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:52,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +28: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +15: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +15: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +62: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:52,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +16: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +16: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 10:58:52,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +12: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +32: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +56: [2023-04-29 10:58:52,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 10:58:52,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +45: [2023-04-29 10:58:52,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 10:58:52,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 10:58:52,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 10:58:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:52,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +26: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 10:58:52,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 10:58:52,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 10:58:52,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 10:58:52,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 10:58:52,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +13: [2023-04-29 10:58:52,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +32: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +24: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +34: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 10:58:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 10:58:52,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +47: [2023-04-29 10:58:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 10:58:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +26: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 10:58:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:52,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:52,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:52,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:52,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:52,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:52,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:52,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 10:58:52,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 10:58:52,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +12: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 10:58:52,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 10:58:52,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:52,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 10:58:52,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +11: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 10:58:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +42: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +14: [2023-04-29 10:58:52,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 10:58:52,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:52,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 10:58:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +19: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 10:58:52,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +19: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:52,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 10:58:52,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:52,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 10:58:52,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 10:58:52,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:52,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:52,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 10:58:52,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 10:58:52,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +60: [2023-04-29 10:58:52,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +60: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +10: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 10:58:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 10:58:52,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:52,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 10:58:52,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +52: [2023-04-29 10:58:52,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +29: [2023-04-29 10:58:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +24: [2023-04-29 10:58:52,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 10:58:52,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +18: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +43: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +59: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 10:58:52,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:52,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +51: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 10:58:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +53: [2023-04-29 10:58:52,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 10:58:52,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 10:58:52,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 10:58:52,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +32: [2023-04-29 10:58:52,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:52,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 10:58:52,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +57: [2023-04-29 10:58:52,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +52: [2023-04-29 10:58:52,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:52,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 10:58:52,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 10:58:52,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:52,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:52,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:52,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 10:58:52,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 10:58:52,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 10:58:52,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 10:58:52,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:52,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 10:58:52,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 10:58:52,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:52,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +53: [2023-04-29 10:58:52,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:52,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 10:58:52,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 10:58:52,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 10:58:52,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 10:58:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +50: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:52,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +62: [2023-04-29 10:58:52,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +50: [2023-04-29 10:58:52,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 10:58:52,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:52,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 10:58:52,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 10:58:52,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 10:58:52,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +62: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +56: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +58: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 6: [2023-04-29 10:58:52,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 10:58:52,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 6: [2023-04-29 10:58:52,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +44: [2023-04-29 10:58:52,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:52,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 4: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 6: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +62: [2023-04-29 10:58:52,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:52,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 10:58:52,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +36: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:52,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:52,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +14: [2023-04-29 10:58:52,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 10:58:52,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 10:58:52,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 10:58:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 10:58:52,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 10:58:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 10:58:52,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 10:58:52,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 10:58:52,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 1: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 10:58:52,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:52,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:52,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +15: [2023-04-29 10:58:52,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 10:58:52,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 10:58:52,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 10:58:52,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:52,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:52,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 10:58:52,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 10:58:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 10:58:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 10:58:52,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 10:58:52,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:52,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +47: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +14: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:52,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:52,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 10:58:52,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 10:58:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:52,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:52,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:52,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:52,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 10:58:52,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:52,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:52,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 10:58:52,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +32: [2023-04-29 10:58:52,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:52,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +34: [2023-04-29 10:58:52,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 10:58:52,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:52,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 10:58:52,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 10:58:52,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:52,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 10:58:52,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 10:58:52,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 10:58:52,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +52: [2023-04-29 10:58:52,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:52,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +19: [2023-04-29 10:58:52,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 10:58:52,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 10:58:52,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +34: [2023-04-29 10:58:52,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 10:58:52,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +47: [2023-04-29 10:58:52,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +52: [2023-04-29 10:58:52,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 10:58:52,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:52,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:52,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 10:58:52,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:52,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 10:58:52,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:52,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:52,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 10:58:52,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 10:58:52,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:52,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:52,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 10:58:52,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 10:58:52,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 10:58:52,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +59: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +18: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 10:58:52,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 10:58:52,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:52,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +60: [2023-04-29 10:58:52,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +18: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +52: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 10:58:52,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 10:58:52,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 10:58:52,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 10:58:52,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:52,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +36: [2023-04-29 10:58:52,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:52,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +32: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 6: [2023-04-29 10:58:52,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +37: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 10:58:52,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 10:58:52,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 10:58:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 10:58:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 10:58:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 10:58:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 10:58:52,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 10:58:52,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 10:58:52,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 10:58:52,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:52,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:52,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:52,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:52,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:52,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:52,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 10:58:52,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:52,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 10:58:52,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +59: [2023-04-29 10:58:52,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 10:58:52,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 10:58:52,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 10:58:52,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 10:58:52,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:52,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 10:58:52,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 10:58:52,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 1: [2023-04-29 10:58:52,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 10:58:52,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 10:58:52,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 10:58:52,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +37: [2023-04-29 10:58:52,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 10:58:52,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 10:58:52,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +37: [2023-04-29 10:58:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 10:58:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 10:58:52,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:52,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 10:58:52,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 10:58:52,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 10:58:52,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:52,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:52,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:52,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:52,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:52,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:52,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 10:58:52,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 10:58:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +50: [2023-04-29 10:58:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:52,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:52,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 10:58:52,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:52,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:52,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:52,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +36: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 10:58:52,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:52,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 10:58:52,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 10:58:52,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +42: [2023-04-29 10:58:52,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 10:58:52,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 10:58:52,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 10:58:52,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 10:58:52,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 10:58:52,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 10:58:52,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 10:58:52,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 10:58:52,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 10:58:52,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 10:58:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +10: [2023-04-29 10:58:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 10:58:52,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 10:58:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +10: [2023-04-29 10:58:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +47: [2023-04-29 10:58:52,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +49: [2023-04-29 10:58:52,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 10:58:52,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 10:58:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 10:58:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 10:58:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +36: [2023-04-29 10:58:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +57: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 10:58:52,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 8: [2023-04-29 10:58:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 10:58:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +33: [2023-04-29 10:58:52,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 10:58:52,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 10:58:52,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 10:58:52,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 10:58:52,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 10:58:52,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 10:58:52,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:52,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 10:58:52,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 10:58:52,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:52,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 10:58:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 10:58:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 10:58:52,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:52,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 10:58:52,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 10:58:52,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 10:58:52,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 10:58:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +37: [2023-04-29 10:58:52,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 10:58:52,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:52,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:52,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 10:58:52,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 10:58:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 10:58:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 10:58:52,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +37: [2023-04-29 10:58:52,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 10:58:52,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 10:58:52,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:52,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 10:58:52,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +40: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +23: [2023-04-29 10:58:52,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 10:58:52,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +32: [2023-04-29 10:58:52,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 10:58:52,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 10:58:52,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 10:58:52,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 10:58:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +63: [2023-04-29 10:58:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 10:58:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 10:58:52,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:52,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 10:58:52,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 10:58:52,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 10:58:52,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +63: [2023-04-29 10:58:52,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:52,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 10:58:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 10:58:52,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +63: [2023-04-29 10:58:52,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +63: [2023-04-29 10:58:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +63: [2023-04-29 10:58:52,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +17: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 10:58:52,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 10:58:52,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +50: [2023-04-29 10:58:52,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 10:58:52,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +23: [2023-04-29 10:58:52,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +56: [2023-04-29 10:58:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:52,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +63: [2023-04-29 10:58:52,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:52,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +51: [2023-04-29 10:58:52,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +51: [2023-04-29 10:58:52,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. +51: [2023-04-29 10:58:52,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:52,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 10:58:52,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:52,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 10:58:52,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +35: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +25: [2023-04-29 10:58:52,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +25: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 10:58:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 10:58:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 10:58:52,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +45: [2023-04-29 10:58:52,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:52,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +40: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +35: [2023-04-29 10:58:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 10:58:52,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 10:58:52,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +58: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +31: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +17: [2023-04-29 10:58:52,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 10:58:52,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 10:58:52,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 10:58:52,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:52,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 10:58:52,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +25: [2023-04-29 10:58:52,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +54: [2023-04-29 10:58:52,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 10:58:52,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 10:58:52,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:52,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 10:58:52,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:52,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +55: [2023-04-29 10:58:52,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:52,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 10:58:52,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 10:58:52,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:52,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:52,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:52,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 10:58:52,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 10:58:52,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 10:58:52,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 10:58:52,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 10:58:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 10:58:52,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:52,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:52,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +15: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +15: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +15: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +33: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +25: [2023-04-29 10:58:52,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 10:58:52,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +61: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 10:58:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +47: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 10:58:52,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +35: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 10:58:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +44: [2023-04-29 10:58:52,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +45: [2023-04-29 10:58:52,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +45: [2023-04-29 10:58:52,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +61: [2023-04-29 10:58:52,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 10:58:52,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +61: [2023-04-29 10:58:52,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 10:58:52,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 10:58:52,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:52,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 10:58:52,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:52,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:52,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:52,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:52,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 10:58:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 10:58:52,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 10:58:52,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:52,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +49: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:52,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +20: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 10:58:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:52,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 10:58:52,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 10:58:52,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 10:58:52,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +44: [2023-04-29 10:58:52,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +46: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 10:58:52,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:52,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:52,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 10:58:52,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:52,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 10:58:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:52,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 10:58:52,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 10:58:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +15: [2023-04-29 10:58:52,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 10:58:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 10:58:52,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 10:58:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 10:58:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 10:58:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:52,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 10:58:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 10:58:52,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 10:58:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 10:58:52,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 10:58:52,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 10:58:52,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 10:58:52,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:52,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 10:58:52,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:52,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:52,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +24: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 10:58:52,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 10:58:52,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 4: [2023-04-29 10:58:52,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +63: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 10:58:52,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +41: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +41: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +24: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 10:58:52,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 10:58:52,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 10:58:52,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:52,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +25: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 10:58:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 10:58:52,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:52,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 10:58:52,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 10:58:52,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +55: [2023-04-29 10:58:52,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 10:58:52,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:52,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:52,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 10:58:52,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 10:58:52,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +31: [2023-04-29 10:58:52,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +55: [2023-04-29 10:58:52,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:52,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +35: [2023-04-29 10:58:52,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +55: [2023-04-29 10:58:52,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +51: [2023-04-29 10:58:52,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +43: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +58: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +61: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 10:58:52,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:52,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 10:58:52,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +45: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +22: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +45: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 10:58:52,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 10:58:52,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:52,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +61: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 10:58:52,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 10:58:52,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 10:58:52,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:52,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 10:58:52,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 10:58:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +47: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +31: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +53: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 10:58:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 10:58:52,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 10:58:52,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:52,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 8: [2023-04-29 10:58:52,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +39: [2023-04-29 10:58:52,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:52,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +21: [2023-04-29 10:58:52,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +47: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 10:58:52,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 10:58:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +25: [2023-04-29 10:58:52,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:52,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:52,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 10:58:52,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 10:58:52,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +20: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +20: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +20: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +20: [2023-04-29 10:58:52,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +34: [2023-04-29 10:58:52,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 10:58:52,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +57: [2023-04-29 10:58:52,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:52,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 10:58:52,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 10:58:52,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 10:58:52,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 10:58:52,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 10:58:52,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 10:58:52,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:52,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:52,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:52,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:52,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 10:58:52,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:52,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 10:58:52,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 5: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 10:58:52,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 10:58:52,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 10:58:52,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 10:58:52,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 10:58:52,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:52,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:52,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:52,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 10:58:52,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 10:58:52,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +42: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +22: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +59: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +22: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:52,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 10:58:52,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:52,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:52,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 10:58:52,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:52,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +22: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 10:58:52,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +37: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 10:58:52,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +22: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 10:58:52,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 10:58:52,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:52,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 10:58:52,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 10:58:52,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +38: [2023-04-29 10:58:52,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:52,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +27: [2023-04-29 10:58:52,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 10:58:52,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 10:58:52,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +49: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:52,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:52,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:52,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +19: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +46: [2023-04-29 10:58:52,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 10:58:52,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 4: [2023-04-29 10:58:52,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 10:58:52,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +11: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +19: [2023-04-29 10:58:52,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:52,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 10:58:52,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 10:58:52,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:52,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +21: [2023-04-29 10:58:52,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 10:58:52,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +44: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:52,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +32: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +43: [2023-04-29 10:58:52,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt... +32: [2023-04-29 10:58:52,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 10:58:52,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 10:58:52,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 10:58:52,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:52,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 10:58:52,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 10:58:52,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:52,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:52,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:52,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 10:58:52,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 10:58:52,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 10:58:52,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:52,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:52,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 10:58:52,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 10:58:52,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 10:58:52,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +36: [2023-04-29 10:58:52,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 10:58:52,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:52,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 10:58:52,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:52,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:52,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:52,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 10:58:52,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 10:58:52,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 10:58:52,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +17: [2023-04-29 10:58:52,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 10:58:52,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:52,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 10:58:52,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 10:58:52,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:52,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:52,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:52,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 10:58:52,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +57: [2023-04-29 10:58:52,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 10:58:52,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 10:58:52,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 10:58:52,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:52,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 10:58:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 10:58:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +30: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:52,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 10:58:52,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 10:58:52,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 10:58:52,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +61: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +17: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +45: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +59: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +58: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 3: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 10:58:52,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +12: [2023-04-29 10:58:52,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +62: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +30: [2023-04-29 10:58:52,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +27: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 10:58:52,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 10:58:52,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:52,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:52,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +41: [2023-04-29 10:58:52,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +22: [2023-04-29 10:58:52,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 10:58:52,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 10:58:52,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 10:58:52,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +18: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +61: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +43: [2023-04-29 10:58:52,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +53: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +53: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +28: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +46: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 10:58:52,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 10:58:52,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 10:58:52,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +59: [2023-04-29 10:58:52,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +22: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +18: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 10:58:52,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 10:58:52,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +29: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 10:58:52,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +43: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +43: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 10:58:52,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 10:58:52,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +57: [2023-04-29 10:58:52,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 10:58:52,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 10:58:52,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 10:58:52,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +22: [2023-04-29 10:58:52,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 10:58:52,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 10:58:52,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 10:58:52,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 10:58:52,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 10:58:52,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +20: [2023-04-29 10:58:52,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:52,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 10:58:52,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +20: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 10:58:52,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:52,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +29: [2023-04-29 10:58:52,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 10:58:52,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 10:58:52,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:52,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 10:58:52,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 10:58:52,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 10:58:52,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +22: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:52,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 10:58:52,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +37: [2023-04-29 10:58:52,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +20: [2023-04-29 10:58:52,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 10:58:52,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +20: [2023-04-29 10:58:52,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +62: [2023-04-29 10:58:52,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +27: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:52,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +26: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +27: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 10:58:52,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +31: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +16: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +31: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +42: [2023-04-29 10:58:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 10:58:52,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 10:58:52,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +42: [2023-04-29 10:58:52,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:52,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 10:58:52,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 10:58:52,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:52,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 10:58:52,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 10:58:52,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +36: [2023-04-29 10:58:52,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 2: [2023-04-29 10:58:52,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 10:58:52,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +36: [2023-04-29 10:58:52,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +53: [2023-04-29 10:58:52,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 10:58:52,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 10:58:52,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 10:58:52,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:52,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:52,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 10:58:52,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 10:58:52,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 10:58:52,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:52,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 10:58:52,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 10:58:52,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:52,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 10:58:52,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 10:58:52,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +15: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +15: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +55: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 10:58:52,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +11: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +62: [2023-04-29 10:58:52,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +11: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +31: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:52,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +40: [2023-04-29 10:58:52,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 10:58:52,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:52,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 10:58:52,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:52,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:52,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +31: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +24: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +52: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 10:58:52,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 10:58:52,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:52,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 10:58:52,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +16: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +56: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:52,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +16: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +33: [2023-04-29 10:58:52,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +29: [2023-04-29 10:58:52,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +36: [2023-04-29 10:58:52,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 10:58:52,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 10:58:52,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:52,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:52,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 10:58:52,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 10:58:52,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +19: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +23: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 0: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +11: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 10:58:52,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 10:58:52,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:52,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 10:58:52,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 3: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:52,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +12: [2023-04-29 10:58:52,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 10:58:52,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 10:58:52,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:52,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 10:58:52,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 10:58:52,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:52,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 10:58:52,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 10:58:52,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +40: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 10:58:52,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +10: [2023-04-29 10:58:52,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 10:58:52,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 10:58:52,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:52,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:52,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 10:58:52,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 10:58:52,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:52,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:52,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 10:58:52,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 10:58:52,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +27: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +36: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +12: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:52,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +30: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 10:58:52,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:52,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 10:58:52,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:52,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:52,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 10:58:52,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:52,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +33: [2023-04-29 10:58:52,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +49: [2023-04-29 10:58:52,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 10:58:52,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +23: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +23: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 10:58:52,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +26: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +26: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 10:58:52,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 10:58:52,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 10:58:52,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +27: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +18: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +57: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:52,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 10:58:52,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +15: [2023-04-29 10:58:52,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:52,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +37: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +37: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +37: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +13: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +47: [2023-04-29 10:58:52,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +13: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 7: [2023-04-29 10:58:52,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +15: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:52,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 10:58:52,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:52,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:52,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:52,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +48: [2023-04-29 10:58:52,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 1: [2023-04-29 10:58:52,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:52,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +47: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +53: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 10:58:52,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:52,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 10:58:52,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 1: [2023-04-29 10:58:52,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:52,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +13: [2023-04-29 10:58:52,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:52,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +35: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +13: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +13: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 10:58:52,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +45: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +28: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +16: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +35: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 10:58:52,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +52: [2023-04-29 10:58:52,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 10:58:52,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 10:58:52,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +53: [2023-04-29 10:58:52,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +53: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +31: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 10:58:52,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +25: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +35: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:52,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 10:58:52,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +45: [2023-04-29 10:58:52,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:52,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +51: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +30: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +35: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +51: [2023-04-29 10:58:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +18: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +18: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +34: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +34: [2023-04-29 10:58:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +34: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +26: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 10:58:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +34: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +14: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 10:58:52,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:52,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 8: [2023-04-29 10:58:52,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 10:58:52,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +51: [2023-04-29 10:58:52,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +51: [2023-04-29 10:58:52,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +51: [2023-04-29 10:58:52,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 10:58:52,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:52,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 10:58:52,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 10:58:52,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:52,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +30: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +49: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:52,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +11: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +34: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. + 2: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:52,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 10:58:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 10:58:52,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 10:58:52,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +33: [2023-04-29 10:58:52,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +37: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 10:58:52,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 10:58:52,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 10:58:52,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 10:58:52,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:52,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +11: [2023-04-29 10:58:52,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +58: [2023-04-29 10:58:52,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 10:58:52,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 10:58:52,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 10:58:52,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +13: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +52: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 10:58:52,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 5: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +13: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +26: [2023-04-29 10:58:52,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:52,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:52,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 10:58:52,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:52,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 10:58:52,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:52,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 10:58:52,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 10:58:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 10:58:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 10:58:52,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:52,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:52,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:52,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +15: [2023-04-29 10:58:52,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:52,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +50: [2023-04-29 10:58:52,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 10:58:52,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:52,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:52,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:52,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 10:58:52,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +18: [2023-04-29 10:58:52,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 10:58:52,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 0: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 10:58:52,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 10:58:52,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 10:58:52,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 10:58:52,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 10:58:52,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 10:58:52,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +34: [2023-04-29 10:58:52,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 10:58:52,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 10:58:52,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:52,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:52,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:52,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:52,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +18: [2023-04-29 10:58:52,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:52,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... + 8: [2023-04-29 10:58:52,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:52,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:52,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 10:58:52,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 10:58:52,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 10:58:52,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 10:58:52,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 10:58:52,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 10:58:52,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:52,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 10:58:52,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 10:58:52,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:52,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +40: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +40: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:52,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +24: [2023-04-29 10:58:52,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:52,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +40: [2023-04-29 10:58:52,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt. +34: [2023-04-29 10:58:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 10:58:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +10: [2023-04-29 10:58:52,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 10:58:52,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:52,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +29: [2023-04-29 10:58:52,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 10:58:52,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 10:58:52,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 10:58:52,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +36: [2023-04-29 10:58:52,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 10:58:52,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +10: [2023-04-29 10:58:52,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 10:58:52,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:52,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:52,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +29: [2023-04-29 10:58:52,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 10:58:52,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 10:58:52,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:52,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:52,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 10:58:52,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +14: [2023-04-29 10:58:52,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:52,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:52,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 10:58:52,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 10:58:52,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:52,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 10:58:52,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 10:58:52,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 10:58:52,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +10: [2023-04-29 10:58:52,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 10:58:52,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +60: [2023-04-29 10:58:52,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +63: [2023-04-29 10:58:52,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:52,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:52,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:52,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:52,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:52,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:52,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:52,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 10:58:52,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:52,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 10:58:52,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:52,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:52,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:52,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:52,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 10:58:52,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +16: [2023-04-29 10:58:52,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +16: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +45: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +47: [2023-04-29 10:58:52,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:52,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 10:58:52,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 10:58:52,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +10: [2023-04-29 10:58:52,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:52,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 10:58:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:52,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 10:58:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 10:58:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:52,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +35: [2023-04-29 10:58:52,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +26: [2023-04-29 10:58:52,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:52,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +34: [2023-04-29 10:58:52,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:52,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +26: [2023-04-29 10:58:52,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +10: [2023-04-29 10:58:52,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 10:58:52,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +47: [2023-04-29 10:58:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 10:58:52,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 10:58:52,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 10:58:52,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:52,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:52,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 10:58:52,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 10:58:52,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:52,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 10:58:52,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 10:58:52,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 10:58:52,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +14: [2023-04-29 10:58:52,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:52,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 10:58:52,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 10:58:52,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 10:58:52,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:52,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:52,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +37: [2023-04-29 10:58:52,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 10:58:52,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:52,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:52,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +52: [2023-04-29 10:58:52,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:52,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:52,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +54: [2023-04-29 10:58:52,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:52,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 10:58:52,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +54: [2023-04-29 10:58:52,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:52,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 10:58:52,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:52,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 10:58:52,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +13: [2023-04-29 10:58:52,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 10:58:52,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:52,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:52,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +47: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 10:58:52,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:52,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 10:58:52,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:52,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 10:58:52,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:52,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:52,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 10:58:52,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 10:58:52,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +18: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:52,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:52,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:52,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +44: [2023-04-29 10:58:52,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:52,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 10:58:52,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:52,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 10:58:52,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 10:58:52,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 10:58:52,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 10:58:52,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:52,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:52,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:52,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:52,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 10:58:52,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:52,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:52,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:52,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:52,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 10:58:52,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:52,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 10:58:52,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:52,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:52,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:52,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:52,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:52,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +34: [2023-04-29 10:58:52,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 10:58:52,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:52,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:52,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 10:58:52,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:52,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 10:58:52,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:52,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 10:58:52,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +14: [2023-04-29 10:58:52,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 10:58:52,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:52,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 10:58:52,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 10:58:52,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 10:58:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 10:58:52,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 10:58:52,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 10:58:52,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 10:58:52,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +19: [2023-04-29 10:58:52,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 10:58:52,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:52,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:52,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 10:58:52,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 10:58:52,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +59: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +59: [2023-04-29 10:58:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 10:58:52,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +59: [2023-04-29 10:58:52,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:52,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +34: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 10:58:52,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 10:58:52,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 10:58:52,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +63: [2023-04-29 10:58:52,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:52,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:52,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:52,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 10:58:52,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +23: [2023-04-29 10:58:52,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 10:58:52,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 10:58:52,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +14: [2023-04-29 10:58:52,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 10:58:52,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 10:58:52,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 10:58:52,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 10:58:52,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:52,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:52,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +13: [2023-04-29 10:58:52,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 10:58:52,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 10:58:52,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:52,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:52,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 10:58:52,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 10:58:52,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 10:58:52,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +14: [2023-04-29 10:58:52,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +14: [2023-04-29 10:58:52,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 10:58:52,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 10:58:52,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 10:58:52,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 10:58:52,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +40: [2023-04-29 10:58:52,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 10:58:52,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 10:58:52,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt. +14: [2023-04-29 10:58:52,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +14: [2023-04-29 10:58:52,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 10:58:52,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 10:58:52,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 10:58:52,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 10:58:52,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 10:58:52,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:52,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:52,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 10:58:52,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +13: [2023-04-29 10:58:52,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 10:58:52,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 10:58:52,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:52,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:52,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:52,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:52,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +20: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +20: [2023-04-29 10:58:52,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +20: [2023-04-29 10:58:52,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +47: [2023-04-29 10:58:52,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 10:58:52,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 10:58:52,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:52,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 10:58:52,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 10:58:52,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:52,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:52,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 10:58:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 10:58:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 10:58:52,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 10:58:52,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 10:58:52,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:52,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:52,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:52,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:52,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:52,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:52,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:52,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 10:58:52,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:52,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 10:58:52,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:52,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:52,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:52,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:52,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 10:58:52,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 10:58:52,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 10:58:52,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +32: [2023-04-29 10:58:52,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +32: [2023-04-29 10:58:52,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 10:58:52,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +47: [2023-04-29 10:58:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:52,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:52,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:52,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 10:58:52,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:52,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:52,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:52,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:52,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:52,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:52,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:52,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 10:58:52,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 10:58:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:52,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:52,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:53,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:53,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 2: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 2: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +40: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:53,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +54: [2023-04-29 10:58:53,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:53,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:53,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:53,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:53,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:53,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 10:58:53,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 10:58:53,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:53,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 10:58:53,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:53,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 10:58:53,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 10:58:53,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 10:58:53,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:53,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:53,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:53,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:53,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:53,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 10:58:53,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:53,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:53,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:53,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 10:58:53,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 10:58:53,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:53,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:53,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:53,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:53,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:53,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +43: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +43: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 10:58:53,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 10:58:53,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 10:58:53,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:53,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:53,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:53,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 10:58:53,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:53,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:53,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:53,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:53,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 10:58:53,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 10:58:53,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:53,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 10:58:53,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 10:58:53,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 10:58:53,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 6: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +36: [2023-04-29 10:58:53,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 10:58:53,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +36: [2023-04-29 10:58:53,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 10:58:53,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:53,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 10:58:53,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:53,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 10:58:53,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:53,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. + 6: [2023-04-29 10:58:53,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 10:58:53,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:53,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:53,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 10:58:53,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:53,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 10:58:53,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 10:58:53,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:53,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:53,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 10:58:53,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:53,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:53,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:53,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:53,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +49: [2023-04-29 10:58:53,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 10:58:53,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 10:58:53,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 10:58:53,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +59: [2023-04-29 10:58:53,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 7: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +49: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 7: [2023-04-29 10:58:53,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +53: [2023-04-29 10:58:53,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 10:58:53,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 10:58:53,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 10:58:53,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 10:58:53,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +36: [2023-04-29 10:58:53,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 10:58:53,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:53,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:53,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:53,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +11: [2023-04-29 10:58:53,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +49: [2023-04-29 10:58:53,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:53,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +59: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:53,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 10:58:53,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +40: [2023-04-29 10:58:53,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 10:58:53,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +24: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +42: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +24: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +52: [2023-04-29 10:58:53,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 10:58:53,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +55: [2023-04-29 10:58:53,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:53,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +31: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +46: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:53,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 10:58:53,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 10:58:53,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 10:58:53,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 10:58:53,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 10:58:53,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 10:58:53,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 10:58:53,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +32: [2023-04-29 10:58:53,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:53,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:53,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 10:58:53,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 10:58:53,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 10:58:53,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 10:58:53,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:53,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 10:58:53,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:53,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:53,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 10:58:53,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +21: [2023-04-29 10:58:53,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:53,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 10:58:53,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +21: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:53,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +30: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 10:58:53,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +50: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +11: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 10:58:53,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:53,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 10:58:53,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:53,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 10:58:53,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 10:58:53,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 10:58:53,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 10:58:53,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 10:58:53,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:53,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:53,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 10:58:53,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:53,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:53,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:53,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 10:58:53,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +45: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 10:58:53,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:53,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 10:58:53,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:53,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 10:58:53,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:53,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 10:58:53,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:53,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 10:58:53,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 10:58:53,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:53,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 10:58:53,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 10:58:53,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +16: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +16: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +38: [2023-04-29 10:58:53,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +48: [2023-04-29 10:58:53,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:53,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 10:58:53,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +36: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:53,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:53,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +39: [2023-04-29 10:58:53,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:53,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 10:58:53,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 10:58:53,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +29: [2023-04-29 10:58:53,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 10:58:53,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:53,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 10:58:53,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:53,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 10:58:53,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:53,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 10:58:53,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 10:58:53,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:53,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 10:58:53,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 10:58:53,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 10:58:53,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +49: [2023-04-29 10:58:53,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:53,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +34: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +26: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +26: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +26: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +26: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +25: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 10:58:53,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 10:58:53,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +16: [2023-04-29 10:58:53,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:53,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 10:58:53,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:53,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 10:58:53,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:53,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:53,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 10:58:53,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 10:58:53,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:53,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:53,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 10:58:53,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:53,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:53,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 10:58:53,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 10:58:53,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +25: [2023-04-29 10:58:53,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +25: [2023-04-29 10:58:53,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:53,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +25: [2023-04-29 10:58:53,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 10:58:53,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 10:58:53,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:53,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:53,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:53,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:53,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:53,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 10:58:53,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:53,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 10:58:53,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:53,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 10:58:53,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 10:58:53,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 10:58:53,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 10:58:53,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 10:58:53,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 10:58:53,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +53: [2023-04-29 10:58:53,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 10:58:53,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 10:58:53,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 10:58:53,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:53,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +26: [2023-04-29 10:58:53,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:53,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +40: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +40: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +40: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:53,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +51: [2023-04-29 10:58:53,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +34: [2023-04-29 10:58:53,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 10:58:53,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:53,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:53,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 10:58:53,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 10:58:53,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 10:58:53,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +51: [2023-04-29 10:58:53,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 10:58:53,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:53,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 10:58:53,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:53,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +31: [2023-04-29 10:58:53,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +31: [2023-04-29 10:58:53,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +31: [2023-04-29 10:58:53,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 10:58:53,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 10:58:53,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 10:58:53,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 10:58:53,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 10:58:53,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +36: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 10:58:53,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +28: [2023-04-29 10:58:53,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:53,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:53,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:53,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:53,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:53,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 10:58:53,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:53,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:53,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:53,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +40: [2023-04-29 10:58:53,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 10:58:53,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 10:58:53,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 10:58:53,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 10:58:53,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:53,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:53,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 10:58:53,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 10:58:53,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:53,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 10:58:53,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:53,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:53,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 10:58:53,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 10:58:53,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:53,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 10:58:53,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 10:58:53,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:53,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:53,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 10:58:53,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +44: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +41: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 10:58:53,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 10:58:53,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:53,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 10:58:53,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 10:58:53,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 10:58:53,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +31: [2023-04-29 10:58:53,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:53,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +10: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +34: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +14: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +32: [2023-04-29 10:58:53,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +32: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 0: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 0: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +34: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +32: [2023-04-29 10:58:53,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +32: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +49: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 10:58:53,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:53,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:53,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +31: [2023-04-29 10:58:53,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 10:58:53,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 10:58:53,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:53,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 10:58:53,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +62: [2023-04-29 10:58:53,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +20: [2023-04-29 10:58:53,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 10:58:53,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 10:58:53,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 8: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 10:58:53,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 10:58:53,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +62: [2023-04-29 10:58:53,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 10:58:53,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 10:58:53,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 10:58:53,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 10:58:53,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 10:58:53,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +13: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +13: [2023-04-29 10:58:53,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +13: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +13: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +33: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:53,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +34: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +40: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 10:58:53,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 10:58:53,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 10:58:53,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 10:58:53,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +31: [2023-04-29 10:58:53,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:53,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 10:58:53,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 10:58:53,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:53,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 10:58:53,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 10:58:53,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 10:58:53,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:53,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 10:58:53,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 10:58:53,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:53,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:53,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:53,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 10:58:53,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 10:58:53,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:53,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +62: [2023-04-29 10:58:53,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:53,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 10:58:53,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 10:58:53,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 10:58:53,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:53,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 10:58:53,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 10:58:53,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:53,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:53,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 10:58:53,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +51: [2023-04-29 10:58:53,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 10:58:53,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +53: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 10:58:53,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +13: [2023-04-29 10:58:53,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:53,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:53,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +13: [2023-04-29 10:58:53,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:53,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 10:58:53,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:53,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:53,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:53,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:53,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 10:58:53,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:53,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 10:58:53,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:53,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 10:58:53,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +49: [2023-04-29 10:58:53,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +20: [2023-04-29 10:58:53,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 10:58:53,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:53,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:53,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 10:58:53,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:53,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:53,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +49: [2023-04-29 10:58:53,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 10:58:53,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:53,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 10:58:53,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 10:58:53,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:53,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 10:58:53,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:53,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 10:58:53,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:53,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 10:58:53,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:53,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 10:58:53,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 10:58:53,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 10:58:53,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +17: [2023-04-29 10:58:53,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 10:58:53,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 10:58:53,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +35: [2023-04-29 10:58:53,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 10:58:53,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 10:58:53,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +10: [2023-04-29 10:58:53,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 10:58:53,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:53,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:53,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 10:58:53,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 10:58:53,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 10:58:53,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +10: [2023-04-29 10:58:53,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +39: [2023-04-29 10:58:53,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:53,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 10:58:53,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 10:58:53,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +44: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +63: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 9: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +44: [2023-04-29 10:58:53,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +12: [2023-04-29 10:58:53,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +55: [2023-04-29 10:58:53,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:53,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:53,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +55: [2023-04-29 10:58:53,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:53,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +11: [2023-04-29 10:58:53,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:53,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 10:58:53,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 10:58:53,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +55: [2023-04-29 10:58:53,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 0: [2023-04-29 10:58:53,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 1: [2023-04-29 10:58:53,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 10:58:53,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:53,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 2: [2023-04-29 10:58:53,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 10:58:53,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:53,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 2: [2023-04-29 10:58:53,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +35: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +35: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +35: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:53,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 10:58:53,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:53,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:53,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +58: [2023-04-29 10:58:53,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +58: [2023-04-29 10:58:53,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +24: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +43: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:53,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 10:58:53,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +11: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 10:58:53,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 10:58:53,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +12: [2023-04-29 10:58:53,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 10:58:53,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +18: [2023-04-29 10:58:53,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +63: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +12: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 10:58:53,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +11: [2023-04-29 10:58:53,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +54: [2023-04-29 10:58:53,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 10:58:53,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 10:58:53,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 10:58:53,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +30: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +21: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +54: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +21: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:53,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 10:58:53,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 10:58:53,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +15: [2023-04-29 10:58:53,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +21: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +29: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +30: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +42: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +42: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +21: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +58: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +21: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:53,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 10:58:53,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 10:58:53,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:53,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 10:58:53,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 10:58:53,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 10:58:53,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +58: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +58: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +50: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 10:58:53,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 10:58:53,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:53,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +19: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +28: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 10:58:53,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +14: [2023-04-29 10:58:53,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 10:58:53,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 10:58:53,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:53,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 10:58:53,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +28: [2023-04-29 10:58:53,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 10:58:53,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 7: [2023-04-29 10:58:53,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 10:58:53,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 10:58:53,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:53,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +39: [2023-04-29 10:58:53,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:53,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:53,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +57: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 10:58:53,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:53,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 7: [2023-04-29 10:58:53,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +22: [2023-04-29 10:58:53,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 10:58:53,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 10:58:53,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 10:58:53,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:53,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 10:58:53,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 10:58:53,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 10:58:53,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:53,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:53,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 10:58:53,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 10:58:53,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 10:58:53,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:53,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 10:58:53,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 10:58:53,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:53,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:53,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:53,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:53,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 10:58:53,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 10:58:53,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 10:58:53,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 10:58:53,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:53,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 10:58:53,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 10:58:53,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +27: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +27: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +27: [2023-04-29 10:58:53,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +27: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:53,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 10:58:53,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 10:58:53,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:53,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 5: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 5: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 10:58:53,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 10:58:53,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:53,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 10:58:53,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +18: [2023-04-29 10:58:53,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 10:58:53,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:53,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 10:58:53,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +39: [2023-04-29 10:58:53,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 10:58:53,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:53,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +13: [2023-04-29 10:58:53,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 10:58:53,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 10:58:53,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:53,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +13: [2023-04-29 10:58:53,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:53,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 10:58:53,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +13: [2023-04-29 10:58:53,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 10:58:53,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:53,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 10:58:53,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 10:58:53,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 10:58:53,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +59: [2023-04-29 10:58:53,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 10:58:53,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:53,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 10:58:53,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:53,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +12: [2023-04-29 10:58:53,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +58: [2023-04-29 10:58:53,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:53,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:53,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +50: [2023-04-29 10:58:53,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +21: [2023-04-29 10:58:53,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +30: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +30: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:53,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:53,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 10:58:53,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +50: [2023-04-29 10:58:53,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:53,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 10:58:53,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 7: [2023-04-29 10:58:53,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 10:58:53,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:53,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 7: [2023-04-29 10:58:53,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 10:58:53,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 10:58:53,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 10:58:53,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 10:58:53,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +28: [2023-04-29 10:58:53,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 10:58:53,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 10:58:53,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +30: [2023-04-29 10:58:53,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:53,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:53,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 10:58:53,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 10:58:53,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 10:58:53,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 10:58:53,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:53,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 10:58:53,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:53,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 10:58:53,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 10:58:53,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +42: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 10:58:53,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 10:58:53,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +37: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +37: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:53,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 10:58:53,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 10:58:53,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:53,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:53,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 10:58:53,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 10:58:53,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:53,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 10:58:53,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:53,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +26: [2023-04-29 10:58:53,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 7: [2023-04-29 10:58:53,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 10:58:53,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:53,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +33: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +33: [2023-04-29 10:58:53,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +26: [2023-04-29 10:58:53,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +26: [2023-04-29 10:58:53,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +10: [2023-04-29 10:58:53,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 10:58:53,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 10:58:53,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 10:58:53,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 10:58:53,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:53,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 10:58:53,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:53,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 10:58:53,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +46: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +46: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +46: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 7: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 5: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +61: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +16: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:53,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +12: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:53,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:53,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:53,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +41: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +41: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +41: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 2: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:53,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +16: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +33: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +16: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +13: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:53,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:53,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:53,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 10:58:53,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 10:58:53,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 10:58:53,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +27: [2023-04-29 10:58:53,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:53,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 10:58:53,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 10:58:53,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:53,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +13: [2023-04-29 10:58:53,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:53,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:53,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:53,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:53,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 10:58:53,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:53,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:53,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 10:58:53,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 10:58:53,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 10:58:53,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +13: [2023-04-29 10:58:53,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:53,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:53,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 10:58:53,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 10:58:53,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 10:58:53,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 10:58:53,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 10:58:53,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 10:58:53,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. +48: [2023-04-29 10:58:53,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +26: [2023-04-29 10:58:53,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 10:58:53,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 10:58:53,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 10:58:53,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 10:58:53,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +26: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +26: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:53,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 10:58:53,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 2: [2023-04-29 10:58:53,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 10:58:53,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 10:58:53,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 10:58:53,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 10:58:53,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 10:58:53,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 10:58:53,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 10:58:53,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 10:58:53,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 10:58:53,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 0: [2023-04-29 10:58:53,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:53,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 10:58:53,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 10:58:53,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +37: [2023-04-29 10:58:53,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:53,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 10:58:53,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 10:58:53,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:53,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 0: [2023-04-29 10:58:53,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 10:58:53,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +26: [2023-04-29 10:58:53,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 10:58:53,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 10:58:53,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 10:58:53,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 10:58:53,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 10:58:53,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 10:58:53,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 4: [2023-04-29 10:58:53,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 10:58:53,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 10:58:53,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 10:58:53,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 10:58:53,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +36: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +61: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 10:58:53,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +36: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +33: [2023-04-29 10:58:53,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:53,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +26: [2023-04-29 10:58:53,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 10:58:53,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 10:58:53,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:53,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +33: [2023-04-29 10:58:53,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 10:58:53,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 10:58:53,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:53,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:53,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 10:58:53,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 10:58:53,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 10:58:53,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:53,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +61: [2023-04-29 10:58:53,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 10:58:53,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 10:58:53,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:53,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 4: [2023-04-29 10:58:53,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 10:58:53,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 10:58:53,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:53,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 10:58:53,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:53,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +25: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +41: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +43: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 10:58:53,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 10:58:53,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:53,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 10:58:53,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:53,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +33: [2023-04-29 10:58:53,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 10:58:53,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:53,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +25: [2023-04-29 10:58:53,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 10:58:53,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 10:58:53,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:53,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:53,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 10:58:53,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 10:58:53,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 10:58:53,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:53,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 10:58:53,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:53,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:53,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:53,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 10:58:53,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:53,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:53,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 10:58:53,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +15: [2023-04-29 10:58:53,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +15: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 10:58:53,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:53,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:53,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:53,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 10:58:53,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:53,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:53,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:53,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:53,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:53,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:53,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:53,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:53,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 10:58:53,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:53,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:53,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:53,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 10:58:53,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 10:58:53,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 10:58:53,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +48: [2023-04-29 10:58:53,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:53,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 10:58:53,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 10:58:53,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +39: [2023-04-29 10:58:53,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +39: [2023-04-29 10:58:53,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 10:58:53,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... + 4: [2023-04-29 10:58:53,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 10:58:53,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:53,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:53,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 10:58:53,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 10:58:53,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:53,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 10:58:53,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +15: [2023-04-29 10:58:53,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 10:58:53,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 4: [2023-04-29 10:58:53,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +56: [2023-04-29 10:58:53,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 10:58:53,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +56: [2023-04-29 10:58:53,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 10:58:53,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:53,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 10:58:53,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt... +56: [2023-04-29 10:58:53,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 10:58:53,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:53,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 10:58:53,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 10:58:53,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:53,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:53,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +56: [2023-04-29 10:58:53,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 10:58:53,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 10:58:53,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:53,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:53,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 10:58:53,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:53,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +56: [2023-04-29 10:58:53,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 10:58:53,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 10:58:53,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 10:58:53,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 10:58:53,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 10:58:53,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 10:58:53,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 10:58:53,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 10:58:53,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +62: [2023-04-29 10:58:53,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +19: [2023-04-29 10:58:53,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +36: [2023-04-29 10:58:53,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 10:58:53,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +19: [2023-04-29 10:58:53,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:53,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 10:58:53,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:53,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 10:58:53,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:53,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 10:58:53,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 10:58:53,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +43: [2023-04-29 10:58:53,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +19: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +51: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 10:58:53,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +25: [2023-04-29 10:58:53,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +36: [2023-04-29 10:58:53,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +62: [2023-04-29 10:58:53,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:53,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 10:58:53,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 10:58:53,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:53,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:53,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +43: [2023-04-29 10:58:53,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:53,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +62: [2023-04-29 10:58:53,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:53,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +43: [2023-04-29 10:58:53,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 10:58:53,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 10:58:53,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 10:58:53,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 10:58:53,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 10:58:53,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 10:58:53,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +62: [2023-04-29 10:58:53,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +15: [2023-04-29 10:58:53,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 10:58:53,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 10:58:53,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:53,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:53,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 10:58:53,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:53,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 10:58:53,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 10:58:53,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:53,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 10:58:53,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 10:58:53,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 10:58:53,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:53,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 10:58:53,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:53,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:53,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:53,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:53,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:53,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 10:58:53,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:53,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 10:58:53,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:53,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:53,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 10:58:53,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:53,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:53,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:53,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:53,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 10:58:53,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 10:58:53,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:53,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:53,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:53,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:53,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:53,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 10:58:53,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 10:58:53,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 10:58:53,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 10:58:53,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 10:58:53,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 10:58:53,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 10:58:53,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 10:58:53,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:53,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:53,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:53,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:53,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:53,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 10:58:53,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 10:58:53,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:53,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +61: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:53,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:53,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 10:58:53,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 10:58:53,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:53,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 6: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 10:58:53,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 10:58:53,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 10:58:53,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:53,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:53,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 10:58:53,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:53,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:53,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:53,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 10:58:53,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:53,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 10:58:53,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 10:58:53,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +59: [2023-04-29 10:58:53,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +48: [2023-04-29 10:58:53,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +20: [2023-04-29 10:58:53,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 10:58:53,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 10:58:53,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. + 8: [2023-04-29 10:58:53,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 10:58:53,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 10:58:53,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 10:58:53,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:53,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 10:58:53,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 10:58:53,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:53,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:53,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 10:58:53,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:53,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:53,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:53,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:53,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:53,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:53,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:53,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 10:58:53,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 10:58:53,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 10:58:53,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:53,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 10:58:53,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 10:58:53,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 10:58:53,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 10:58:53,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +49: [2023-04-29 10:58:53,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:53,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +40: [2023-04-29 10:58:53,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +40: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +58: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:53,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +43: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +59: [2023-04-29 10:58:53,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +22: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +37: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 10:58:53,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +43: [2023-04-29 10:58:53,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 10:58:53,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 10:58:53,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 10:58:53,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:53,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:53,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:53,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:53,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +51: [2023-04-29 10:58:53,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +51: [2023-04-29 10:58:53,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:53,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:53,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 10:58:53,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +51: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +17: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +59: [2023-04-29 10:58:53,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:53,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 10:58:53,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 10:58:53,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 10:58:53,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:53,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 10:58:53,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:53,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 10:58:53,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 10:58:53,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +37: [2023-04-29 10:58:53,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 10:58:53,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +17: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:53,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:53,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 10:58:53,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +11: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:53,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:53,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:53,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +59: [2023-04-29 10:58:53,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +11: [2023-04-29 10:58:53,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 10:58:53,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +36: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:53,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 10:58:53,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +54: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:53,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:53,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +11: [2023-04-29 10:58:53,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:53,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 10:58:53,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +32: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +22: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 10:58:53,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +61: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:53,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:53,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:53,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 10:58:53,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:53,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +32: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:53,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 10:58:53,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 10:58:53,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +24: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 10:58:53,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:53,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 10:58:53,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 10:58:53,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 10:58:53,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:53,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 10:58:53,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 10:58:53,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 10:58:53,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 10:58:53,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 10:58:53,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:53,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 10:58:53,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 10:58:53,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:53,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:53,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 10:58:53,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +38: [2023-04-29 10:58:53,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +25: [2023-04-29 10:58:53,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:53,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:53,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:53,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 10:58:53,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 10:58:53,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:53,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:53,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 10:58:53,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:53,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 10:58:53,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +35: [2023-04-29 10:58:53,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:53,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:53,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:53,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:53,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:53,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:53,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:53,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:53,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:53,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 10:58:53,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 10:58:53,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 10:58:53,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +32: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:53,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 10:58:53,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:53,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:53,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 10:58:53,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:53,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:53,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +48: [2023-04-29 10:58:53,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:53,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 10:58:53,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 10:58:53,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 10:58:53,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 10:58:53,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 10:58:53,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 10:58:53,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:53,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 10:58:53,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:53,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 10:58:53,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:53,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:53,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 10:58:53,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 10:58:53,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +40: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:53,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +17: [2023-04-29 10:58:53,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:53,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:53,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 10:58:53,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:53,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 10:58:53,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +22: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +49: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 10:58:53,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 10:58:53,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +20: [2023-04-29 10:58:53,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +20: [2023-04-29 10:58:53,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:53,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +20: [2023-04-29 10:58:53,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:53,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 10:58:53,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 10:58:53,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +49: [2023-04-29 10:58:53,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:53,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:53,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 10:58:53,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 10:58:53,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 9: [2023-04-29 10:58:53,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 10:58:53,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:53,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 10:58:53,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 10:58:53,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:53,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:53,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +50: [2023-04-29 10:58:53,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 10:58:53,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 10:58:53,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:53,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 10:58:53,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:53,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:53,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +29: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +36: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:53,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:53,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 10:58:53,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 10:58:53,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:53,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 10:58:53,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:53,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:53,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +38: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:53,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:53,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 10:58:53,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +22: [2023-04-29 10:58:53,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +11: [2023-04-29 10:58:53,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +22: [2023-04-29 10:58:53,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:53,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:53,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +58: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +38: [2023-04-29 10:58:53,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 10:58:53,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +38: [2023-04-29 10:58:53,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 10:58:53,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +63: [2023-04-29 10:58:53,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 10:58:53,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 10:58:53,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:53,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 10:58:53,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:53,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:53,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 10:58:53,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:53,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:53,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 10:58:53,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:53,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:53,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:53,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 10:58:53,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:53,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +11: [2023-04-29 10:58:53,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:53,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +24: [2023-04-29 10:58:53,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +24: [2023-04-29 10:58:53,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:53,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +32: [2023-04-29 10:58:53,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +11: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 10:58:53,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:53,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:53,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:53,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:53,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:53,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 10:58:53,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:53,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:53,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 10:58:53,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +24: [2023-04-29 10:58:53,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +45: [2023-04-29 10:58:53,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:53,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 10:58:53,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:53,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 10:58:53,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 10:58:53,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +36: [2023-04-29 10:58:53,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:53,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 10:58:53,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 10:58:53,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 10:58:53,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 10:58:53,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:53,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:53,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:53,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:53,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 10:58:53,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 10:58:53,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 10:58:53,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:53,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:53,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 10:58:53,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:53,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:53,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +30: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:53,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:53,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:53,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:53,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:53,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 10:58:53,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +18: [2023-04-29 10:58:53,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 10:58:53,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:53,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +44: [2023-04-29 10:58:53,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:53,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +18: [2023-04-29 10:58:53,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +37: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 10:58:53,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:53,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:53,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 10:58:53,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:53,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:53,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:53,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 10:58:53,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 10:58:53,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +21: [2023-04-29 10:58:53,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 10:58:53,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 10:58:53,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 10:58:53,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:53,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 10:58:53,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 3: [2023-04-29 10:58:53,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:53,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:53,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 10:58:53,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:53,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 10:58:53,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 10:58:53,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 10:58:53,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +50: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +41: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 10:58:53,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:53,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:53,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:53,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:53,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:53,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 10:58:53,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 10:58:53,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 10:58:53,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 10:58:53,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +12: [2023-04-29 10:58:53,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:53,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +18: [2023-04-29 10:58:53,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 10:58:53,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:53,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +35: [2023-04-29 10:58:53,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +35: [2023-04-29 10:58:53,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 9: [2023-04-29 10:58:53,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 10:58:53,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +18: [2023-04-29 10:58:53,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:53,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +38: [2023-04-29 10:58:53,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:53,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:53,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 10:58:53,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:53,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +55: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +55: [2023-04-29 10:58:53,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:53,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:53,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:53,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 10:58:53,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 10:58:53,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:53,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:53,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:53,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 10:58:53,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 10:58:53,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +55: [2023-04-29 10:58:53,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:53,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:53,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:53,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 10:58:53,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 10:58:53,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:53,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +20: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +52: [2023-04-29 10:58:53,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 10:58:53,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 10:58:53,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +20: [2023-04-29 10:58:53,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +20: [2023-04-29 10:58:53,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 10:58:53,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:53,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 10:58:53,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +53: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +53: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +55: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +53: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 10:58:53,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 5: [2023-04-29 10:58:53,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 10:58:53,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 10:58:53,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 10:58:53,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 8: [2023-04-29 10:58:53,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:53,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 10:58:54,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +19: [2023-04-29 10:58:54,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 10:58:54,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:54,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +63: [2023-04-29 10:58:54,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +19: [2023-04-29 10:58:54,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +38: [2023-04-29 10:58:54,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:54,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:54,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:54,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +63: [2023-04-29 10:58:54,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +19: [2023-04-29 10:58:54,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +54: [2023-04-29 10:58:54,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +54: [2023-04-29 10:58:54,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +54: [2023-04-29 10:58:54,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +54: [2023-04-29 10:58:54,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 10:58:54,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:54,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:54,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 10:58:54,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 10:58:54,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +52: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 10:58:54,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 10:58:54,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 10:58:54,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 10:58:54,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 10:58:54,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:54,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +52: [2023-04-29 10:58:54,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 10:58:54,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 10:58:54,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:54,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:54,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:54,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 10:58:54,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:54,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:54,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:54,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:54,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 10:58:54,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 10:58:54,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +33: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:54,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +12: [2023-04-29 10:58:54,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:54,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:54,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:54,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:54,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:54,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:54,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 10:58:54,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:54,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:54,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:54,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:54,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:54,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:54,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:54,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 10:58:54,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 10:58:54,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:54,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:54,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 10:58:54,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:54,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 10:58:54,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 10:58:54,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 10:58:54,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 10:58:54,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 10:58:54,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 10:58:54,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:54,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:54,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 10:58:54,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +54: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:54,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 10:58:54,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 10:58:54,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 10:58:54,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:54,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:54,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 10:58:54,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +37: [2023-04-29 10:58:54,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 10:58:54,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +13: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 3: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +23: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +23: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +23: [2023-04-29 10:58:54,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 10:58:54,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:54,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 10:58:54,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:54,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +46: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +46: [2023-04-29 10:58:54,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 2: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +34: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +42: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +42: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +42: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 2: [2023-04-29 10:58:54,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +46: [2023-04-29 10:58:54,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +13: [2023-04-29 10:58:54,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:54,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:54,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:54,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:54,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:54,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 10:58:54,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 10:58:54,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:54,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 10:58:54,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:54,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 10:58:54,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:54,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:54,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:54,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 10:58:54,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:54,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +27: [2023-04-29 10:58:54,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:54,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:54,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:54,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 10:58:54,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +27: [2023-04-29 10:58:54,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 10:58:54,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:54,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 10:58:54,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:54,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 10:58:54,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:54,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 10:58:54,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:54,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:54,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 10:58:54,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 10:58:54,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +13: [2023-04-29 10:58:54,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:54,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:54,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:54,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 10:58:54,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 10:58:54,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 10:58:54,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +42: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +39: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 10:58:54,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +39: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 10:58:54,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +21: [2023-04-29 10:58:54,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 10:58:54,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 10:58:54,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 10:58:54,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 10:58:54,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 10:58:54,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:54,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +52: [2023-04-29 10:58:54,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 10:58:54,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 10:58:54,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +47: [2023-04-29 10:58:54,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 10:58:54,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 10:58:54,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 10:58:54,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 10:58:54,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 10:58:54,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 10:58:54,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 10:58:54,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 10:58:54,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 10:58:54,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +47: [2023-04-29 10:58:54,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:54,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +52: [2023-04-29 10:58:54,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 10:58:54,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 10:58:54,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:54,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:54,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt... +27: [2023-04-29 10:58:54,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:54,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:54,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:54,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 10:58:54,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +63: [2023-04-29 10:58:54,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:54,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:54,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:54,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:54,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +63: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +14: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +29: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +14: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +54: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +29: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +29: [2023-04-29 10:58:54,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +54: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +14: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:54,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +14: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +32: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:54,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:54,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:54,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +14: [2023-04-29 10:58:54,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +14: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +58: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +58: [2023-04-29 10:58:54,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +16: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:54,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 10:58:54,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 10:58:54,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +46: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +44: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:54,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:54,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +29: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +18: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +26: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:54,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +55: [2023-04-29 10:58:54,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:54,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 10:58:54,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +52: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 10:58:54,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 10:58:54,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:54,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:54,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +23: [2023-04-29 10:58:54,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +33: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 10:58:54,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:54,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 10:58:54,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 10:58:54,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:54,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +17: [2023-04-29 10:58:54,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +26: [2023-04-29 10:58:54,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +55: [2023-04-29 10:58:54,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 3: [2023-04-29 10:58:54,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 10:58:54,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +23: [2023-04-29 10:58:54,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 10:58:54,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:54,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +26: [2023-04-29 10:58:54,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:54,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:54,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:54,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +10: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +39: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:54,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 10:58:54,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 10:58:54,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +21: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 10:58:54,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:54,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 10:58:54,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +16: [2023-04-29 10:58:54,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +47: [2023-04-29 10:58:54,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +17: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:54,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 1: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +60: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +60: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +39: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 2: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +21: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +60: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 6: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 10:58:54,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +53: [2023-04-29 10:58:54,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:54,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:54,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +47: [2023-04-29 10:58:54,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 10:58:54,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:54,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 10:58:54,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 10:58:54,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 10:58:54,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 10:58:54,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 10:58:54,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +21: [2023-04-29 10:58:54,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +27: [2023-04-29 10:58:54,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 10:58:54,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +27: [2023-04-29 10:58:54,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 10:58:54,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +26: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +46: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +47: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 10:58:54,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +47: [2023-04-29 10:58:54,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +26: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 10:58:54,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 10:58:54,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 10:58:54,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 10:58:54,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 10:58:54,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:54,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +32: [2023-04-29 10:58:54,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 10:58:54,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:54,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:54,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:54,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 10:58:54,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 10:58:54,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:54,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +23: [2023-04-29 10:58:54,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 10:58:54,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +47: [2023-04-29 10:58:54,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:54,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +13: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +14: [2023-04-29 10:58:54,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:54,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:54,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:54,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:54,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 10:58:54,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 10:58:54,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 10:58:54,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:54,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 10:58:54,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 10:58:54,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 10:58:54,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +18: [2023-04-29 10:58:54,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +19: [2023-04-29 10:58:54,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 10:58:54,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 10:58:54,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +27: [2023-04-29 10:58:54,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 10:58:54,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +27: [2023-04-29 10:58:54,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 10:58:54,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:54,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +52: [2023-04-29 10:58:54,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 10:58:54,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 10:58:54,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 10:58:54,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:54,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 10:58:54,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +50: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +52: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +50: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 10:58:54,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 10:58:54,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 10:58:54,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +18: [2023-04-29 10:58:54,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 10:58:54,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +52: [2023-04-29 10:58:54,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 10:58:54,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 10:58:54,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:54,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:54,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 10:58:54,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:54,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:54,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +40: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 10:58:54,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +18: [2023-04-29 10:58:54,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:54,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:54,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 10:58:54,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:54,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 10:58:54,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 10:58:54,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 10:58:54,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 10:58:54,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 10:58:54,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:54,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:54,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:54,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:54,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:54,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:54,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 10:58:54,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +36: [2023-04-29 10:58:54,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:54,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:54,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:54,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:54,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 10:58:54,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 10:58:54,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:54,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:54,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 6: [2023-04-29 10:58:54,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 10:58:54,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 10:58:54,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:54,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:54,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 10:58:54,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 10:58:54,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 10:58:54,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +28: [2023-04-29 10:58:54,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 6: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 10:58:54,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +49: [2023-04-29 10:58:54,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 10:58:54,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +16: [2023-04-29 10:58:54,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +49: [2023-04-29 10:58:54,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 10:58:54,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +26: [2023-04-29 10:58:54,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 10:58:54,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +49: [2023-04-29 10:58:54,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 10:58:54,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:54,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 10:58:54,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +43: [2023-04-29 10:58:54,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:54,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +43: [2023-04-29 10:58:54,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:54,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:54,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:54,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 10:58:54,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 10:58:54,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:54,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:54,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 10:58:54,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:54,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 10:58:54,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 10:58:54,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 10:58:54,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:54,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:54,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 10:58:54,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 10:58:54,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +51: [2023-04-29 10:58:54,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:54,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 10:58:54,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:54,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 10:58:54,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +60: [2023-04-29 10:58:54,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 10:58:54,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +26: [2023-04-29 10:58:54,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +48: [2023-04-29 10:58:54,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:54,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 10:58:54,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +33: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +48: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:54,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:54,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 10:58:54,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +48: [2023-04-29 10:58:54,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +22: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +48: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 10:58:54,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +48: [2023-04-29 10:58:54,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +19: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +48: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 10:58:54,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +15: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 10:58:54,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 10:58:54,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:54,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 10:58:54,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 10:58:54,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 10:58:54,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 10:58:54,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 10:58:54,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 6: [2023-04-29 10:58:54,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 10:58:54,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:54,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 10:58:54,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 10:58:54,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:54,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 10:58:54,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +11: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +45: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 10:58:54,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +59: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +54: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 10:58:54,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:54,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +24: [2023-04-29 10:58:54,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:54,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 10:58:54,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:54,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 10:58:54,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 10:58:54,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 10:58:54,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 10:58:54,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:54,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:54,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 10:58:54,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +50: [2023-04-29 10:58:54,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:54,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 10:58:54,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 10:58:54,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 10:58:54,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 10:58:54,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:54,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:54,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 10:58:54,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 10:58:54,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 10:58:54,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 10:58:54,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 10:58:54,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +24: [2023-04-29 10:58:54,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:54,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:54,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 10:58:54,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +22: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +39: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +39: [2023-04-29 10:58:54,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +22: [2023-04-29 10:58:54,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 10:58:54,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +22: [2023-04-29 10:58:54,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 10:58:54,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 10:58:54,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 10:58:54,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 10:58:54,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:54,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:54,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:54,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 10:58:54,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +59: [2023-04-29 10:58:54,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:54,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:54,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 10:58:54,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:54,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 10:58:54,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 10:58:54,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 10:58:54,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 10:58:54,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +49: [2023-04-29 10:58:54,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:54,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 10:58:54,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 10:58:54,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:54,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:54,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +40: [2023-04-29 10:58:54,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 10:58:54,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 10:58:54,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 10:58:54,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 10:58:54,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +49: [2023-04-29 10:58:54,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 10:58:54,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:54,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +49: [2023-04-29 10:58:54,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +59: [2023-04-29 10:58:54,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 10:58:54,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +24: [2023-04-29 10:58:54,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 10:58:54,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:54,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:54,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:54,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 10:58:54,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 10:58:54,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:54,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:54,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:54,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 10:58:54,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 10:58:54,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:54,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 10:58:54,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 10:58:54,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +15: [2023-04-29 10:58:54,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +15: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +43: [2023-04-29 10:58:54,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:54,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 10:58:54,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 10:58:54,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:54,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +36: [2023-04-29 10:58:54,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:54,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:54,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 10:58:54,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +61: [2023-04-29 10:58:54,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +61: [2023-04-29 10:58:54,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 10:58:54,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +61: [2023-04-29 10:58:54,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 10:58:54,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +17: [2023-04-29 10:58:54,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:54,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:54,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:54,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 6: [2023-04-29 10:58:54,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +54: [2023-04-29 10:58:54,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 10:58:54,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:54,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:54,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 10:58:54,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:54,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:54,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:54,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:54,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 10:58:54,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:54,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +36: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 10:58:54,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +47: [2023-04-29 10:58:54,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:54,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 10:58:54,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:54,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:54,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:54,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +33: [2023-04-29 10:58:54,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 10:58:54,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 10:58:54,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 10:58:54,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 10:58:54,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +43: [2023-04-29 10:58:54,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:54,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 10:58:54,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +45: [2023-04-29 10:58:54,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 6: [2023-04-29 10:58:54,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +30: [2023-04-29 10:58:54,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +41: [2023-04-29 10:58:54,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +30: [2023-04-29 10:58:54,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 10:58:54,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 10:58:54,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:54,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:54,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 10:58:54,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 10:58:54,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +30: [2023-04-29 10:58:54,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:54,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:54,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 10:58:54,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:54,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 10:58:54,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +33: [2023-04-29 10:58:54,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 10:58:54,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 10:58:54,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:54,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 10:58:54,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 10:58:54,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +57: [2023-04-29 10:58:54,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 10:58:54,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:54,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 10:58:54,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +56: [2023-04-29 10:58:54,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +12: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +12: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +54: [2023-04-29 10:58:54,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 10:58:54,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt. +22: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 10:58:54,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 10:58:54,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +61: [2023-04-29 10:58:54,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:54,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 10:58:54,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +54: [2023-04-29 10:58:54,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +22: [2023-04-29 10:58:54,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +22: [2023-04-29 10:58:54,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 10:58:54,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 10:58:54,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +62: [2023-04-29 10:58:54,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 10:58:54,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 10:58:54,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +22: [2023-04-29 10:58:54,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 10:58:54,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +22: [2023-04-29 10:58:54,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 10:58:54,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 10:58:54,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 10:58:54,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 10:58:54,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 10:58:54,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 10:58:54,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +59: [2023-04-29 10:58:54,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:54,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 10:58:54,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:54,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 10:58:54,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 10:58:54,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 10:58:54,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:54,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:54,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 10:58:54,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:54,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:54,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:54,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:54,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:54,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 10:58:54,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +39: [2023-04-29 10:58:54,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 10:58:54,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 10:58:54,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 10:58:54,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 10:58:54,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 10:58:54,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 10:58:54,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:54,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +18: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:54,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 10:58:54,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 10:58:54,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 10:58:54,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:54,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 10:58:54,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 10:58:54,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 10:58:54,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 10:58:54,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 10:58:54,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 10:58:54,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +21: [2023-04-29 10:58:54,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +62: [2023-04-29 10:58:54,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 10:58:54,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +48: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +48: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:54,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:54,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +48: [2023-04-29 10:58:54,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 10:58:54,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +47: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 8: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:54,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +22: [2023-04-29 10:58:54,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 10:58:54,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:54,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:54,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 10:58:54,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:54,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:54,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +22: [2023-04-29 10:58:54,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 10:58:54,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 10:58:54,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 10:58:54,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +61: [2023-04-29 10:58:54,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:54,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:54,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:54,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 10:58:54,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:54,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 10:58:54,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 10:58:54,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +36: [2023-04-29 10:58:54,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:54,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:54,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:54,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 10:58:54,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +17: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +48: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:54,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +34: [2023-04-29 10:58:54,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 10:58:54,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:54,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:54,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 10:58:54,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +51: [2023-04-29 10:58:54,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 10:58:54,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 10:58:54,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 10:58:54,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 10:58:54,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 10:58:54,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +59: [2023-04-29 10:58:54,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:54,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +51: [2023-04-29 10:58:54,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +25: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +61: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +25: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +51: [2023-04-29 10:58:54,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 10:58:54,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +59: [2023-04-29 10:58:54,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 10:58:54,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 10:58:54,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 10:58:54,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 10:58:54,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 10:58:54,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:54,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 10:58:54,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 10:58:54,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 10:58:54,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:54,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 10:58:54,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 10:58:54,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +44: [2023-04-29 10:58:54,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:54,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:54,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 10:58:54,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 10:58:54,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +31: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +37: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 10:58:54,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 10:58:54,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +18: [2023-04-29 10:58:54,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 10:58:54,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +59: [2023-04-29 10:58:54,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 0: [2023-04-29 10:58:54,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +52: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 10:58:54,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:54,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +44: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +44: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:54,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:54,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:54,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 10:58:54,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 10:58:54,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +18: [2023-04-29 10:58:54,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 10:58:54,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:54,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 10:58:54,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 10:58:54,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:54,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:54,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 10:58:54,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +18: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:54,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +51: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 10:58:54,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +45: [2023-04-29 10:58:54,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +41: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 10:58:54,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +53: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +12: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +62: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:54,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 10:58:54,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 10:58:54,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 10:58:54,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 10:58:54,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +21: [2023-04-29 10:58:54,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 10:58:54,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 10:58:54,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +32: [2023-04-29 10:58:54,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +12: [2023-04-29 10:58:54,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +41: [2023-04-29 10:58:54,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:54,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 10:58:54,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 10:58:54,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:54,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 10:58:54,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 10:58:54,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 10:58:54,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 10:58:54,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 10:58:54,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 10:58:54,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 10:58:54,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:54,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 10:58:54,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:54,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 10:58:54,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 10:58:54,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:54,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 10:58:54,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 10:58:54,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 10:58:54,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 10:58:54,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 10:58:54,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 10:58:54,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +34: [2023-04-29 10:58:54,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:54,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 10:58:54,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:54,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +48: [2023-04-29 10:58:54,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 10:58:54,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +53: [2023-04-29 10:58:54,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 10:58:54,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:54,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 10:58:54,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +18: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:54,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +53: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:54,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:54,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +48: [2023-04-29 10:58:54,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 10:58:54,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +10: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +10: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +42: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +10: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +48: [2023-04-29 10:58:54,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 10:58:54,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:54,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 10:58:54,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:54,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:54,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 10:58:54,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 10:58:54,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 10:58:54,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:54,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 10:58:54,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:54,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:54,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:54,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:54,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:54,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:54,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +32: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:54,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 10:58:54,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:54,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +50: [2023-04-29 10:58:54,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:54,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 10:58:54,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:54,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 10:58:54,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 10:58:54,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 10:58:54,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +24: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +34: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +23: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 10:58:54,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 10:58:54,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +43: [2023-04-29 10:58:54,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +23: [2023-04-29 10:58:54,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 10:58:54,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 10:58:54,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:54,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 10:58:54,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 10:58:54,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 10:58:54,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:54,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +23: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 10:58:54,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:54,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:54,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 10:58:54,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +10: [2023-04-29 10:58:54,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +43: [2023-04-29 10:58:54,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +45: [2023-04-29 10:58:54,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:54,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +10: [2023-04-29 10:58:54,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 10:58:54,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +43: [2023-04-29 10:58:54,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +49: [2023-04-29 10:58:54,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 10:58:54,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 10:58:54,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 10:58:54,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +45: [2023-04-29 10:58:54,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 10:58:54,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 10:58:54,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 10:58:54,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 10:58:54,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:54,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +51: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 10:58:54,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 10:58:54,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:54,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:54,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +25: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +37: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 10:58:54,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:54,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 10:58:54,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 10:58:54,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +37: [2023-04-29 10:58:54,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +25: [2023-04-29 10:58:54,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 10:58:54,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 10:58:54,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +37: [2023-04-29 10:58:54,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 10:58:54,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 10:58:54,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:54,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 10:58:54,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +52: [2023-04-29 10:58:54,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 10:58:54,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +52: [2023-04-29 10:58:54,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 10:58:54,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 10:58:54,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:54,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 10:58:54,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 9: [2023-04-29 10:58:54,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 10:58:54,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +37: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +20: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +20: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +40: [2023-04-29 10:58:54,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +20: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +52: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +52: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 8: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +53: [2023-04-29 10:58:54,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 10:58:54,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:54,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 10:58:54,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 10:58:54,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +31: [2023-04-29 10:58:54,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +40: [2023-04-29 10:58:54,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 10:58:54,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +45: [2023-04-29 10:58:54,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:54,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +58: [2023-04-29 10:58:54,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:54,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 10:58:54,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +50: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 10:58:54,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 10:58:54,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 10:58:54,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 10:58:54,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 10:58:54,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:54,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +52: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:54,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:54,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 10:58:54,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 10:58:54,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +49: [2023-04-29 10:58:54,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +38: [2023-04-29 10:58:54,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:54,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +53: [2023-04-29 10:58:54,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +39: [2023-04-29 10:58:54,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 10:58:54,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 10:58:54,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 10:58:54,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:54,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:54,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 10:58:54,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +32: [2023-04-29 10:58:54,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 10:58:54,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 10:58:54,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 10:58:54,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 10:58:54,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:54,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 10:58:54,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 10:58:54,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +32: [2023-04-29 10:58:54,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +23: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 10:58:54,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... + 9: [2023-04-29 10:58:54,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 10:58:54,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 10:58:54,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 10:58:54,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:54,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:54,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:54,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 10:58:54,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 10:58:54,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 10:58:54,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:54,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:54,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 10:58:54,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:54,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:54,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:54,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:54,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt... +29: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 10:58:54,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 10:58:54,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:54,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:54,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:54,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:54,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +10: [2023-04-29 10:58:54,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 10:58:54,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 10:58:54,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:54,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:54,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +35: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 10:58:54,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +42: [2023-04-29 10:58:54,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:54,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 10:58:54,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +58: [2023-04-29 10:58:54,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 10:58:54,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:54,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +34: [2023-04-29 10:58:54,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 10:58:54,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:54,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:54,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 10:58:54,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 10:58:54,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:54,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +14: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +14: [2023-04-29 10:58:54,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +14: [2023-04-29 10:58:54,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 10:58:54,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 10:58:54,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 10:58:54,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 10:58:54,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:54,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:54,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 10:58:54,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:54,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +55: [2023-04-29 10:58:54,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:54,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 10:58:54,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:54,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +31: [2023-04-29 10:58:54,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +32: [2023-04-29 10:58:54,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:54,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 10:58:54,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 10:58:54,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:54,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +14: [2023-04-29 10:58:54,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +39: [2023-04-29 10:58:54,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:54,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 10:58:54,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +58: [2023-04-29 10:58:54,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 10:58:54,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +60: [2023-04-29 10:58:54,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 10:58:54,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 10:58:54,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:54,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:54,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +55: [2023-04-29 10:58:54,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 10:58:54,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 10:58:54,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:54,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 10:58:54,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +58: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:54,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 10:58:54,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:54,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 10:58:54,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:54,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:54,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 10:58:54,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +55: [2023-04-29 10:58:54,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 9: [2023-04-29 10:58:54,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +24: [2023-04-29 10:58:54,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 10:58:54,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:54,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 10:58:54,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:54,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 1: [2023-04-29 10:58:54,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 10:58:54,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:54,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +39: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:54,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +20: [2023-04-29 10:58:54,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 10:58:54,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:54,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:54,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +52: [2023-04-29 10:58:54,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 10:58:54,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:54,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:54,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +60: [2023-04-29 10:58:54,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:54,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 10:58:54,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:54,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:54,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:54,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 10:58:54,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:54,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 10:58:54,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:54,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:54,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:54,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 10:58:54,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +15: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 10:58:54,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 10:58:54,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 10:58:54,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 10:58:54,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 10:58:54,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 10:58:54,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:54,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:54,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:54,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:54,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:54,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 10:58:54,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 10:58:54,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt. +47: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 10:58:54,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 10:58:54,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:54,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:54,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 10:58:54,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 10:58:54,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:54,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:54,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 10:58:54,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 10:58:54,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 10:58:54,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 10:58:54,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:54,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:54,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:54,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +19: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +19: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +19: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 10:58:54,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 10:58:54,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 10:58:54,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:54,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:54,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:54,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +15: [2023-04-29 10:58:54,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 10:58:54,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:54,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:54,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 6: [2023-04-29 10:58:54,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 10:58:54,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:54,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 10:58:54,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +14: [2023-04-29 10:58:54,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +24: [2023-04-29 10:58:54,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 6: [2023-04-29 10:58:54,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +32: [2023-04-29 10:58:54,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 10:58:54,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:54,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:54,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 10:58:54,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +56: [2023-04-29 10:58:54,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +46: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:54,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:54,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 10:58:54,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 10:58:54,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 10:58:54,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 10:58:54,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:54,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:54,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:54,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:54,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 10:58:54,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 10:58:54,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 10:58:54,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:54,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:54,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 10:58:54,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 10:58:54,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:54,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +11: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +11: [2023-04-29 10:58:54,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +11: [2023-04-29 10:58:54,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 10:58:54,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:54,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 10:58:54,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:54,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:54,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 10:58:54,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:54,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 10:58:54,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 10:58:54,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 10:58:54,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +40: [2023-04-29 10:58:54,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:54,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:54,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:54,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:54,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:54,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:54,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:54,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:54,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:54,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:54,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:54,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:54,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:54,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:54,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 10:58:54,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +15: [2023-04-29 10:58:54,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 10:58:54,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:54,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:54,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:54,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:54,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 10:58:54,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 10:58:54,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:54,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 10:58:54,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +15: [2023-04-29 10:58:54,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +56: [2023-04-29 10:58:54,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 10:58:54,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:54,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:54,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:54,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:54,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 10:58:54,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 10:58:54,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 10:58:54,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:54,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:54,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 10:58:54,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 10:58:54,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 10:58:54,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +30: [2023-04-29 10:58:54,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:54,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:54,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 10:58:54,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 10:58:54,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:54,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:54,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 10:58:54,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:54,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +12: [2023-04-29 10:58:54,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:54,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 10:58:54,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt. +47: [2023-04-29 10:58:54,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 10:58:54,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 6: [2023-04-29 10:58:54,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:54,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:54,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 10:58:54,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:54,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:54,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 10:58:54,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:54,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 10:58:54,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +53: [2023-04-29 10:58:54,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +15: [2023-04-29 10:58:54,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +19: [2023-04-29 10:58:54,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +33: [2023-04-29 10:58:54,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 10:58:54,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 10:58:54,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 10:58:54,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:54,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +16: [2023-04-29 10:58:54,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +16: [2023-04-29 10:58:54,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +16: [2023-04-29 10:58:54,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +40: [2023-04-29 10:58:54,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:54,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +36: [2023-04-29 10:58:54,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:54,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +31: [2023-04-29 10:58:54,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +31: [2023-04-29 10:58:54,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +31: [2023-04-29 10:58:54,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 6: [2023-04-29 10:58:54,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 10:58:54,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +59: [2023-04-29 10:58:54,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:54,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:54,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 10:58:54,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +43: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 10:58:54,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +59: [2023-04-29 10:58:54,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +40: [2023-04-29 10:58:54,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +53: [2023-04-29 10:58:54,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +57: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 10:58:54,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 10:58:54,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:54,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:54,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +15: [2023-04-29 10:58:54,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:54,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:54,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 10:58:54,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:54,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 10:58:54,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 10:58:54,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:54,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 10:58:54,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +36: [2023-04-29 10:58:54,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 10:58:54,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +46: [2023-04-29 10:58:54,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 10:58:54,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:54,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 10:58:54,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 10:58:54,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:54,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:54,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:54,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 10:58:54,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 10:58:54,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 10:58:54,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:54,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:54,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 10:58:54,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:54,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +36: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:54,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +36: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:54,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 10:58:54,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 10:58:54,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +59: [2023-04-29 10:58:54,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:54,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:54,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:54,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +40: [2023-04-29 10:58:54,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:54,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 10:58:54,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 10:58:54,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:54,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:54,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:54,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 10:58:54,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 10:58:54,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:54,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +53: [2023-04-29 10:58:54,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:54,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 10:58:54,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:54,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +23: [2023-04-29 10:58:54,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +23: [2023-04-29 10:58:54,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +40: [2023-04-29 10:58:54,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 10:58:54,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +59: [2023-04-29 10:58:54,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:54,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 10:58:54,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +22: [2023-04-29 10:58:54,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +22: [2023-04-29 10:58:54,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 10:58:54,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:54,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:54,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:54,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:54,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:54,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:54,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +48: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:54,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 10:58:54,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +57: [2023-04-29 10:58:54,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +48: [2023-04-29 10:58:54,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:54,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 10:58:54,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:54,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 10:58:54,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 10:58:54,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 10:58:54,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 7: [2023-04-29 10:58:54,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:54,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:54,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:54,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:54,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 10:58:54,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:54,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:54,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:54,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:54,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:54,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:54,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 10:58:54,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 10:58:54,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:54,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:54,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:54,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +31: [2023-04-29 10:58:54,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:54,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 10:58:54,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:54,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:54,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:54,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 10:58:54,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:54,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:54,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 10:58:54,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:54,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 10:58:54,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 10:58:54,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +31: [2023-04-29 10:58:54,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +21: [2023-04-29 10:58:54,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:54,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:54,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 10:58:54,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 10:58:54,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:54,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +18: [2023-04-29 10:58:54,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:54,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:54,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:54,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:54,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:54,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:54,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:54,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 10:58:54,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:54,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:54,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:54,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:54,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:54,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:54,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:54,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 10:58:54,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:54,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 10:58:54,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 10:58:54,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +29: [2023-04-29 10:58:54,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +28: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +28: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +28: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +28: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 10:58:54,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 10:58:54,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 10:58:54,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 10:58:54,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:54,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 10:58:54,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +48: [2023-04-29 10:58:54,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 10:58:54,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 10:58:54,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:54,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 10:58:54,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +20: [2023-04-29 10:58:54,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 10:58:54,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +23: [2023-04-29 10:58:54,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 10:58:54,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 10:58:54,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 10:58:54,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:54,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 10:58:54,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:54,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 10:58:54,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:54,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 7: [2023-04-29 10:58:54,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +38: [2023-04-29 10:58:54,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:54,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +23: [2023-04-29 10:58:54,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +38: [2023-04-29 10:58:54,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 10:58:54,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:54,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 10:58:54,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 10:58:54,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 10:58:54,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 10:58:54,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 10:58:54,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +45: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 10:58:54,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:54,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 10:58:54,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +25: [2023-04-29 10:58:54,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +29: [2023-04-29 10:58:54,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:54,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +45: [2023-04-29 10:58:54,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:54,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 10:58:54,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 10:58:54,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:54,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:54,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 10:58:54,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +51: [2023-04-29 10:58:54,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:54,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:54,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 10:58:54,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +48: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:54,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:54,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:54,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +51: [2023-04-29 10:58:54,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 10:58:54,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:54,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:54,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 10:58:54,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 10:58:54,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 10:58:54,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +20: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +48: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +44: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 10:58:55,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:55,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 10:58:55,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:55,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 10:58:55,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +48: [2023-04-29 10:58:55,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:55,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +38: [2023-04-29 10:58:55,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:55,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:55,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:55,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 10:58:55,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +18: [2023-04-29 10:58:55,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 10:58:55,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 10:58:55,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:55,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +13: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +13: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 10:58:55,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 10:58:55,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:55,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:55,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 10:58:55,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 10:58:55,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:55,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 10:58:55,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +50: [2023-04-29 10:58:55,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:55,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 10:58:55,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:55,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 10:58:55,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 10:58:55,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 10:58:55,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:55,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:55,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:55,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 10:58:55,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:55,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +14: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 10:58:55,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:55,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:55,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 10:58:55,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 10:58:55,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:55,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 10:58:55,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:55,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:55,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 10:58:55,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +45: [2023-04-29 10:58:55,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 10:58:55,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +21: [2023-04-29 10:58:55,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +21: [2023-04-29 10:58:55,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +21: [2023-04-29 10:58:55,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +45: [2023-04-29 10:58:55,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:55,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +45: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 10:58:55,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 10:58:55,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:55,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +11: [2023-04-29 10:58:55,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +11: [2023-04-29 10:58:55,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 10:58:55,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +11: [2023-04-29 10:58:55,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:55,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:55,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 10:58:55,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +49: [2023-04-29 10:58:55,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:55,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:55,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 10:58:55,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 10:58:55,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 10:58:55,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 10:58:55,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 10:58:55,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +17: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +35: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +17: [2023-04-29 10:58:55,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 10:58:55,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +35: [2023-04-29 10:58:55,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 10:58:55,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:55,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:55,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt... +38: [2023-04-29 10:58:55,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt... +38: [2023-04-29 10:58:55,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt... +38: [2023-04-29 10:58:55,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt... +45: [2023-04-29 10:58:55,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 10:58:55,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +21: [2023-04-29 10:58:55,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:55,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:55,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:55,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:55,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:55,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:55,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:55,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 10:58:55,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:55,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 10:58:55,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +36: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +36: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 10:58:55,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 10:58:55,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:55,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:55,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 10:58:55,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 10:58:55,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 10:58:55,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 10:58:55,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:55,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:55,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:55,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 10:58:55,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 10:58:55,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 10:58:55,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:55,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:55,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:55,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 10:58:55,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +63: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +63: [2023-04-29 10:58:55,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 10:58:55,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +44: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +44: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 10:58:55,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 10:58:55,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +50: [2023-04-29 10:58:55,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:55,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:55,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 10:58:55,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +26: [2023-04-29 10:58:55,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +26: [2023-04-29 10:58:55,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +26: [2023-04-29 10:58:55,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +26: [2023-04-29 10:58:55,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +36: [2023-04-29 10:58:55,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 10:58:55,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 10:58:55,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +57: [2023-04-29 10:58:55,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +36: [2023-04-29 10:58:55,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:55,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:55,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +11: [2023-04-29 10:58:55,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +41: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +41: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +33: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +33: [2023-04-29 10:58:55,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 10:58:55,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:55,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +35: [2023-04-29 10:58:55,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +35: [2023-04-29 10:58:55,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 8: [2023-04-29 10:58:55,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +35: [2023-04-29 10:58:55,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +35: [2023-04-29 10:58:55,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 10:58:55,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 10:58:55,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 10:58:55,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 10:58:55,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 10:58:55,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 10:58:55,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 10:58:55,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:55,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:55,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:55,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 10:58:55,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 10:58:55,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt... +45: [2023-04-29 10:58:55,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt... +45: [2023-04-29 10:58:55,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt... +45: [2023-04-29 10:58:55,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +57: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:55,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt... +44: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt... +44: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt... +44: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt... +26: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:55,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 10:58:55,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 10:58:55,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 10:58:55,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:55,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 10:58:55,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:55,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 10:58:55,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +16: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +16: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 10:58:55,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 10:58:55,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 10:58:55,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 10:58:55,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:55,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 10:58:55,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 10:58:55,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +21: [2023-04-29 10:58:55,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +57: [2023-04-29 10:58:55,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:55,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +60: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +50: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt... +50: [2023-04-29 10:58:55,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt... +50: [2023-04-29 10:58:55,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt... +50: [2023-04-29 10:58:55,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt... +59: [2023-04-29 10:58:55,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 10:58:55,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +42: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 10:58:55,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:55,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:55,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 10:58:55,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 10:58:55,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:55,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:55,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:55,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:55,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +42: [2023-04-29 10:58:55,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:55,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +17: [2023-04-29 10:58:55,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 10:58:55,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 10:58:55,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:55,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:55,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:55,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +41: [2023-04-29 10:58:55,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt... +41: [2023-04-29 10:58:55,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt... +41: [2023-04-29 10:58:55,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt... +17: [2023-04-29 10:58:55,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 10:58:55,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:55,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +59: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +47: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt... +17: [2023-04-29 10:58:55,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:55,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +35: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:55,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +47: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 10:58:55,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:55,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:55,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:55,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:55,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:55,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +28: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 1: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 10:58:55,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 1: [2023-04-29 10:58:55,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:55,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +41: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +36: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +41: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +42: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +42: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +28: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +42: [2023-04-29 10:58:55,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:55,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 10:58:55,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 10:58:55,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:55,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +46: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +46: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:55,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:55,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 10:58:55,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:55,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:55,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 10:58:55,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 10:58:55,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +46: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +20: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +20: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +20: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:55,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 10:58:55,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 10:58:55,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 10:58:55,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +27: [2023-04-29 10:58:55,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 10:58:55,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:55,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +63: [2023-04-29 10:58:55,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 10:58:55,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:55,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:55,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 10:58:55,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:55,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 10:58:55,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 10:58:55,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 10:58:55,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 10:58:55,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:55,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:55,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 10:58:55,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +46: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 10:58:55,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +49: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +27: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +26: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 10:58:55,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +42: [2023-04-29 10:58:55,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 10:58:55,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 10:58:55,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +42: [2023-04-29 10:58:55,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 10:58:55,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:55,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 10:58:55,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +63: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:55,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt... +49: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt... +26: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt... +62: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +49: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt... +46: [2023-04-29 10:58:55,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:55,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +23: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +46: [2023-04-29 10:58:55,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +58: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +26: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 10:58:55,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +54: [2023-04-29 10:58:55,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:55,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:55,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 10:58:55,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 10:58:55,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 10:58:55,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:55,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:55,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:55,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:55,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 10:58:55,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +60: [2023-04-29 10:58:55,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +18: [2023-04-29 10:58:55,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +54: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:55,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:55,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:55,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:55,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +45: [2023-04-29 10:58:55,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +45: [2023-04-29 10:58:55,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +56: [2023-04-29 10:58:55,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +47: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +45: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:55,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +47: [2023-04-29 10:58:55,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 10:58:55,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 10:58:55,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +33: [2023-04-29 10:58:55,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:55,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:55,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +35: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:55,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +35: [2023-04-29 10:58:55,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt... +35: [2023-04-29 10:58:55,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt... +57: [2023-04-29 10:58:55,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:55,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 10:58:55,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:55,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt... +32: [2023-04-29 10:58:55,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:55,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 10:58:55,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt... +55: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt... +55: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt... +55: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt... +32: [2023-04-29 10:58:55,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:55,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +56: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +32: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:55,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +10: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +35: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt... +54: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt... +54: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt... +54: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt... +54: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt... + 1: [2023-04-29 10:58:55,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 10:58:55,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:55,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 10:58:55,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +32: [2023-04-29 10:58:55,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +32: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +32: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +28: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:55,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 10:58:55,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +18: [2023-04-29 10:58:55,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 10:58:55,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +44: [2023-04-29 10:58:55,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 10:58:55,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 10:58:55,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +10: [2023-04-29 10:58:55,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:55,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:55,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 10:58:55,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +28: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +47: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +18: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 10:58:55,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 10:58:55,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 10:58:55,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 10:58:55,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +35: [2023-04-29 10:58:55,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 10:58:55,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +52: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +52: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +50: [2023-04-29 10:58:55,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +26: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +26: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 10:58:55,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:55,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +52: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 10:58:55,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 10:58:55,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 10:58:55,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +16: [2023-04-29 10:58:55,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +16: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +27: [2023-04-29 10:58:55,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +16: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:55,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +42: [2023-04-29 10:58:55,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 10:58:55,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:55,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 10:58:55,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:55,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:55,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 10:58:55,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +44: [2023-04-29 10:58:55,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 10:58:55,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 10:58:55,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +27: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:55,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +42: [2023-04-29 10:58:55,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 10:58:55,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 10:58:55,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 10:58:55,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 10:58:55,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +13: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +41: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 10:58:55,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:55,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +43: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +28: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +43: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +58: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +44: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +58: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +23: [2023-04-29 10:58:55,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +58: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +41: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 10:58:55,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 10:58:55,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +28: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +56: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +46: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +42: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +42: [2023-04-29 10:58:55,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:55,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 10:58:55,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 10:58:55,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +28: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 10:58:55,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +29: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +58: [2023-04-29 10:58:55,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +58: [2023-04-29 10:58:55,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +29: [2023-04-29 10:58:55,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +42: [2023-04-29 10:58:55,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 10:58:55,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +39: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 10:58:55,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:55,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +55: [2023-04-29 10:58:55,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:55,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +42: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:55,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:55,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 10:58:55,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 10:58:55,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +63: [2023-04-29 10:58:55,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 10:58:55,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt... +52: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt... +52: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt... +63: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt... +60: [2023-04-29 10:58:55,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:55,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt... +42: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt... +42: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt... +42: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt... +63: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:55,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +63: [2023-04-29 10:58:55,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:55,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +32: [2023-04-29 10:58:55,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:55,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:55,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:55,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:55,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:55,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 10:58:55,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:55,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +18: [2023-04-29 10:58:55,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 10:58:55,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt... +47: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt... +47: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt... +47: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt... +18: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +19: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +13: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +13: [2023-04-29 10:58:55,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 10:58:55,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +46: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +18: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +19: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 10:58:55,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +18: [2023-04-29 10:58:55,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 10:58:55,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:55,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +46: [2023-04-29 10:58:55,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 10:58:55,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +45: [2023-04-29 10:58:55,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 10:58:55,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:55,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:55,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 10:58:55,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +46: [2023-04-29 10:58:55,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 10:58:55,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 10:58:55,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:55,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:55,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:55,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 10:58:55,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt... +58: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt... +58: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt... +58: [2023-04-29 10:58:55,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt... +34: [2023-04-29 10:58:55,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 10:58:55,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +32: [2023-04-29 10:58:55,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 10:58:55,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 10:58:55,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 10:58:55,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 10:58:55,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 10:58:55,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt... +61: [2023-04-29 10:58:55,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt... +61: [2023-04-29 10:58:55,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt... +61: [2023-04-29 10:58:55,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt... +45: [2023-04-29 10:58:55,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +23: [2023-04-29 10:58:55,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:55,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 10:58:55,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 10:58:55,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:55,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +23: [2023-04-29 10:58:55,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:55,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 10:58:55,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:55,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:55,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 10:58:55,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 10:58:55,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 10:58:55,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 10:58:55,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 10:58:55,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:55,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:55,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt... +37: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt... +37: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt... +37: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt... +13: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 10:58:55,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt... +39: [2023-04-29 10:58:55,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt... +39: [2023-04-29 10:58:55,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt... +39: [2023-04-29 10:58:55,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt... +50: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:55,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 10:58:55,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 10:58:55,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:55,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:55,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:55,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +53: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +10: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +28: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +21: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +21: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +40: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +57: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:55,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +29: [2023-04-29 10:58:55,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 10:58:55,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 10:58:55,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:55,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +28: [2023-04-29 10:58:55,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +40: [2023-04-29 10:58:55,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:55,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:55,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +16: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +33: [2023-04-29 10:58:55,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 10:58:55,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt... +63: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt... +33: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt... +63: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt... +43: [2023-04-29 10:58:55,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +29: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +44: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +33: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +44: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:55,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 10:58:55,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 10:58:55,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 10:58:55,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:55,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 10:58:55,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 10:58:55,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +50: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +28: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +53: [2023-04-29 10:58:55,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +57: [2023-04-29 10:58:55,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 10:58:55,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt... +60: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt... +60: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt... +56: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +40: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +40: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 10:58:55,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt... +46: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt... +46: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt... +46: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt... +46: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt... +32: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +32: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 10:58:55,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt... +56: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt... +56: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt... +56: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt... +28: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 10:58:55,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 10:58:55,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 10:58:55,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 10:58:55,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 10:58:55,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 10:58:55,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:55,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +24: [2023-04-29 10:58:55,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +24: [2023-04-29 10:58:55,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +21: [2023-04-29 10:58:55,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 10:58:55,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 10:58:55,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +21: [2023-04-29 10:58:55,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 10:58:55,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:55,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +25: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +25: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +48: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +48: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +25: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +21: [2023-04-29 10:58:55,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:55,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:55,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:55,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:55,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 10:58:55,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 10:58:55,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 10:58:55,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 10:58:55,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 10:58:55,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +11: [2023-04-29 10:58:55,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +11: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +34: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:55,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 10:58:55,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt... +32: [2023-04-29 10:58:55,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt... +32: [2023-04-29 10:58:55,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt... +53: [2023-04-29 10:58:55,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:55,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt... + 6: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 10:58:55,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:55,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:55,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 10:58:55,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 10:58:55,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 10:58:55,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 10:58:55,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 10:58:55,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 10:58:55,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:55,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:55,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 10:58:55,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 10:58:55,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 10:58:55,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 10:58:55,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:55,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 10:58:55,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 10:58:55,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:55,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 10:58:55,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 10:58:55,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +25: [2023-04-29 10:58:55,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 10:58:55,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 10:58:55,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +13: [2023-04-29 10:58:55,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +13: [2023-04-29 10:58:55,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 10:58:55,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 10:58:55,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 10:58:55,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 10:58:55,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +11: [2023-04-29 10:58:55,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 10:58:55,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 10:58:55,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 10:58:55,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 10:58:55,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 10:58:55,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +13: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +40: [2023-04-29 10:58:55,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:55,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 10:58:55,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 10:58:55,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 10:58:55,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 10:58:55,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +26: [2023-04-29 10:58:55,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +26: [2023-04-29 10:58:55,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +26: [2023-04-29 10:58:55,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +43: [2023-04-29 10:58:55,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +38: [2023-04-29 10:58:55,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 10:58:55,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:55,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:55,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 10:58:55,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 10:58:55,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +43: [2023-04-29 10:58:55,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:55,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:55,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +57: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 10:58:55,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 10:58:55,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 10:58:55,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 10:58:55,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:55,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 10:58:55,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 10:58:55,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +21: [2023-04-29 10:58:55,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 10:58:55,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:55,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:55,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +30: [2023-04-29 10:58:55,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 10:58:55,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +51: [2023-04-29 10:58:55,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 10:58:55,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:55,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 10:58:55,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 10:58:55,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 10:58:55,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 10:58:55,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:55,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 10:58:55,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 10:58:55,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +21: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +40: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +43: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +21: [2023-04-29 10:58:55,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +21: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +30: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +30: [2023-04-29 10:58:55,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +33: [2023-04-29 10:58:55,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 10:58:55,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +14: [2023-04-29 10:58:55,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +21: [2023-04-29 10:58:55,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +30: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +40: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:55,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 9: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +34: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 10:58:55,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 10:58:55,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:55,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +48: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:55,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +22: [2023-04-29 10:58:55,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +53: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 10:58:55,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:55,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:55,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +57: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +57: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 10:58:55,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +22: [2023-04-29 10:58:55,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 10:58:55,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:55,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:55,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:55,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:55,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:55,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 10:58:55,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 10:58:55,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:55,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:55,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +38: [2023-04-29 10:58:55,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt. +36: [2023-04-29 10:58:55,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,497] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 308 +36: [2023-04-29 10:58:55,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 10:58:55,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 10:58:55,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 10:58:55,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:55,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:55,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:55,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 10:58:55,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 10:58:55,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 10:58:55,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:55,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:55,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 10:58:55,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +10: [2023-04-29 10:58:55,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 10:58:55,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 10:58:55,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt... +43: [2023-04-29 10:58:55,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt... +43: [2023-04-29 10:58:55,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt... +43: [2023-04-29 10:58:55,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt... +48: [2023-04-29 10:58:55,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 10:58:55,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 10:58:55,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt... +48: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt... +33: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt... +33: [2023-04-29 10:58:55,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt... +17: [2023-04-29 10:58:55,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 10:58:55,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 10:58:55,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 10:58:55,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +48: [2023-04-29 10:58:55,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +38: [2023-04-29 10:58:55,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 10:58:55,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:55,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 10:58:55,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 10:58:55,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:55,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:55,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 10:58:55,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 10:58:55,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +40: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt... +40: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt... +40: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt... +40: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt... + 1: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 10:58:55,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt. +20: [2023-04-29 10:58:55,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +20: [2023-04-29 10:58:55,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 10:58:55,540] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 306 +26: [2023-04-29 10:58:55,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 10:58:55,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +20: [2023-04-29 10:58:55,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 10:58:55,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +25: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 10:58:55,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 10:58:55,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 10:58:55,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 10:58:55,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 10:58:55,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 10:58:55,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 10:58:55,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 10:58:55,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 10:58:55,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 10:58:55,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 10:58:55,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +22: [2023-04-29 10:58:55,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 10:58:55,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt. +44: [2023-04-29 10:58:55,552] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 358 +26: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 10:58:55,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 10:58:55,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +62: [2023-04-29 10:58:55,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt... +53: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt... +53: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt... +53: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt... + 2: [2023-04-29 10:58:55,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +22: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 10:58:55,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt. +62: [2023-04-29 10:58:55,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:55,562] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 352 +17: [2023-04-29 10:58:55,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt... + 6: [2023-04-29 10:58:55,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt... +57: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt... +10: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 10:58:55,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 10:58:55,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 10:58:55,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 10:58:55,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +57: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt... + 1: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +20: [2023-04-29 10:58:55,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 10:58:55,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt... +34: [2023-04-29 10:58:55,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt... +34: [2023-04-29 10:58:55,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt... +34: [2023-04-29 10:58:55,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt... + 1: [2023-04-29 10:58:55,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:55,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 10:58:55,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +22: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt... +36: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt... +36: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt... +22: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +36: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt... +20: [2023-04-29 10:58:55,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 10:58:55,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 10:58:55,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:55,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 10:58:55,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +51: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +15: [2023-04-29 10:58:55,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 10:58:55,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 10:58:55,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +15: [2023-04-29 10:58:55,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +62: [2023-04-29 10:58:55,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:55,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:55,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +16: [2023-04-29 10:58:55,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 10:58:55,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 10:58:55,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +45: [2023-04-29 10:58:55,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:55,589] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 362 +24: [2023-04-29 10:58:55,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 10:58:55,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +22: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +62: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +22: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:55,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:55,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 10:58:55,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 10:58:55,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt. + 7: [2023-04-29 10:58:55,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 10:58:55,596] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 356 +59: [2023-04-29 10:58:55,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:55,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:55,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 10:58:55,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt... +48: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt... +59: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt... +48: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt... +23: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +59: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 10:58:55,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +23: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +29: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +29: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +23: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +29: [2023-04-29 10:58:55,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +59: [2023-04-29 10:58:55,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 10:58:55,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +25: [2023-04-29 10:58:55,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 10:58:55,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:55,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +11: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +25: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 10:58:55,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 10:58:55,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:55,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +21: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +45: [2023-04-29 10:58:55,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:55,624] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 366 +31: [2023-04-29 10:58:55,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 10:58:55,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:55,626] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 360 + 9: [2023-04-29 10:58:55,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 10:58:55,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 10:58:55,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 10:58:55,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +29: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt. +14: [2023-04-29 10:58:55,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 10:58:55,638] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 304 + 6: [2023-04-29 10:58:55,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 10:58:55,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 10:58:55,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt. +55: [2023-04-29 10:58:55,641] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 440 +25: [2023-04-29 10:58:55,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:55,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt... +62: [2023-04-29 10:58:55,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt... +62: [2023-04-29 10:58:55,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt... +25: [2023-04-29 10:58:55,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:55,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:55,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt... +17: [2023-04-29 10:58:55,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 10:58:55,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +25: [2023-04-29 10:58:55,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:55,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +28: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +28: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +30: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +15: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt. + 5: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +27: [2023-04-29 10:58:55,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 10:58:55,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:55,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:55,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 10:58:55,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:55,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 10:58:55,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 10:58:55,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +41: [2023-04-29 10:58:55,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt. +27: [2023-04-29 10:58:55,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 10:58:55,663] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 334 +27: [2023-04-29 10:58:55,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +27: [2023-04-29 10:58:55,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:55,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 10:58:55,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:55,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 10:58:55,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 10:58:55,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:55,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +13: [2023-04-29 10:58:55,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 10:58:55,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +13: [2023-04-29 10:58:55,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 10:58:55,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +30: [2023-04-29 10:58:55,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +51: [2023-04-29 10:58:55,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +11: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:55,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +30: [2023-04-29 10:58:55,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 10:58:55,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +21: [2023-04-29 10:58:55,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 10:58:55,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +24: [2023-04-29 10:58:55,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +59: [2023-04-29 10:58:55,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:55,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 10:58:55,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:55,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +47: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:55,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:55,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:55,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:55,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 10:58:55,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 10:58:55,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 8: [2023-04-29 10:58:55,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +37: [2023-04-29 10:58:55,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 10:58:55,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 10:58:55,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt... +28: [2023-04-29 10:58:55,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 4: [2023-04-29 10:58:55,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 10:58:55,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +19: [2023-04-29 10:58:55,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +11: [2023-04-29 10:58:55,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:55,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:55,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:55,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 8: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +11: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 10:58:55,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 10:58:55,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:55,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 10:58:55,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:55,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:55,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt. +35: [2023-04-29 10:58:55,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 280 + 5: [2023-04-29 10:58:55,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 10:58:55,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:55,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt. + 3: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 10:58:55,720] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 444 +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt... +51: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt... + 5: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt... +23: [2023-04-29 10:58:55,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:55,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt... +11: [2023-04-29 10:58:55,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:55,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +59: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +59: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +21: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 1: [2023-04-29 10:58:55,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 10:58:55,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 1: [2023-04-29 10:58:55,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 10:58:55,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +23: [2023-04-29 10:58:55,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +23: [2023-04-29 10:58:55,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +18: [2023-04-29 10:58:55,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 10:58:55,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 10:58:55,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 10:58:55,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 10:58:55,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:55,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:55,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:55,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:55,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 10:58:55,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt. +58: [2023-04-29 10:58:55,745] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 470 + 3: [2023-04-29 10:58:55,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:55,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt. +30: [2023-04-29 10:58:55,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +35: [2023-04-29 10:58:55,746] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 286 +27: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 10:58:55,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:55,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 10:58:55,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 10:58:55,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +18: [2023-04-29 10:58:55,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 10:58:55,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 10:58:55,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 10:58:55,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 10:58:55,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:55,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +18: [2023-04-29 10:58:55,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 5: [2023-04-29 10:58:55,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:55,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:55,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +37: [2023-04-29 10:58:55,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +20: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 10:58:55,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt. +20: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 10:58:55,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 10:58:55,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 10:58:55,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +35: [2023-04-29 10:58:55,753] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 284 +20: [2023-04-29 10:58:55,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +30: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +59: [2023-04-29 10:58:55,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 10:58:55,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +47: [2023-04-29 10:58:55,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 10:58:55,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:55,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +28: [2023-04-29 10:58:55,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 10:58:55,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +27: [2023-04-29 10:58:55,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 10:58:55,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 10:58:55,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:55,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 10:58:55,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt. +54: [2023-04-29 10:58:55,759] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 434 +37: [2023-04-29 10:58:55,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +41: [2023-04-29 10:58:55,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt. +41: [2023-04-29 10:58:55,761] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 328 +28: [2023-04-29 10:58:55,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 10:58:55,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 10:58:55,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 10:58:55,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 10:58:55,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt. +56: [2023-04-29 10:58:55,763] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 450 +52: [2023-04-29 10:58:55,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt. +52: [2023-04-29 10:58:55,764] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 418 +37: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt... +26: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 10:58:55,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +59: [2023-04-29 10:58:55,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt... +59: [2023-04-29 10:58:55,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt... +59: [2023-04-29 10:58:55,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt... +59: [2023-04-29 10:58:55,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt... +26: [2023-04-29 10:58:55,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +30: [2023-04-29 10:58:55,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 10:58:55,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 10:58:55,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +28: [2023-04-29 10:58:55,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 10:58:55,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:55,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 10:58:55,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 10:58:55,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 10:58:55,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt. +30: [2023-04-29 10:58:55,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 10:58:55,771] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 392 +18: [2023-04-29 10:58:55,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:55,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +38: [2023-04-29 10:58:55,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt. +16: [2023-04-29 10:58:55,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +38: [2023-04-29 10:58:55,773] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 310 +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 10:58:55,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt. +63: [2023-04-29 10:58:55,775] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 510 +35: [2023-04-29 10:58:55,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 10:58:55,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 10:58:55,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 10:58:55,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +21: [2023-04-29 10:58:55,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +12: [2023-04-29 10:58:55,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 10:58:55,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 10:58:55,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +30: [2023-04-29 10:58:55,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 10:58:55,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:55,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 10:58:55,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 10:58:55,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt. +16: [2023-04-29 10:58:55,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 10:58:55,779] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 446 +12: [2023-04-29 10:58:55,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 10:58:55,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:55,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +12: [2023-04-29 10:58:55,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +12: [2023-04-29 10:58:55,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +12: [2023-04-29 10:58:55,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt. +21: [2023-04-29 10:58:55,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +21: [2023-04-29 10:58:55,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +28: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +50: [2023-04-29 10:58:55,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt. +50: [2023-04-29 10:58:55,786] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 400 + 1: [2023-04-29 10:58:55,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 10:58:55,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:55,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 10:58:55,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt. +61: [2023-04-29 10:58:55,788] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 494 + 2: [2023-04-29 10:58:55,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 10:58:55,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +63: [2023-04-29 10:58:55,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +63: [2023-04-29 10:58:55,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +63: [2023-04-29 10:58:55,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +26: [2023-04-29 10:58:55,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +36: [2023-04-29 10:58:55,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 10:58:55,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 10:58:55,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 10:58:55,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +28: [2023-04-29 10:58:55,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 10:58:55,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 10:58:55,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:55,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 10:58:55,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +13: [2023-04-29 10:58:55,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +13: [2023-04-29 10:58:55,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 10:58:55,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 10:58:55,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +13: [2023-04-29 10:58:55,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +13: [2023-04-29 10:58:55,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +13: [2023-04-29 10:58:55,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 10:58:55,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:55,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt. +37: [2023-04-29 10:58:55,807] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 302 +35: [2023-04-29 10:58:55,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 10:58:55,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 10:58:55,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:55,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 10:58:55,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 10:58:55,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 10:58:55,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 10:58:55,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 10:58:55,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:55,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 10:58:55,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:55,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +54: [2023-04-29 10:58:55,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +54: [2023-04-29 10:58:55,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +54: [2023-04-29 10:58:55,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +10: [2023-04-29 10:58:55,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +54: [2023-04-29 10:58:55,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +59: [2023-04-29 10:58:55,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:55,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 10:58:55,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:55,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 10:58:55,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +29: [2023-04-29 10:58:55,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +23: [2023-04-29 10:58:55,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:55,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 10:58:55,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 10:58:55,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 10:58:55,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 10:58:55,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 10:58:55,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +29: [2023-04-29 10:58:55,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 10:58:55,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 10:58:55,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 10:58:55,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +14: [2023-04-29 10:58:55,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 10:58:55,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt. +42: [2023-04-29 10:58:55,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 338 +52: [2023-04-29 10:58:55,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt. +52: [2023-04-29 10:58:55,840] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 422 +14: [2023-04-29 10:58:55,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 10:58:55,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 10:58:55,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 10:58:55,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:55,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:55,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 10:58:55,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 10:58:55,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt. +39: [2023-04-29 10:58:55,845] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 316 +20: [2023-04-29 10:58:55,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:55,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 10:58:55,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +42: [2023-04-29 10:58:55,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +14: [2023-04-29 10:58:55,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +42: [2023-04-29 10:58:55,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +14: [2023-04-29 10:58:55,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +42: [2023-04-29 10:58:55,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +14: [2023-04-29 10:58:55,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:55,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 10:58:55,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 10:58:55,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt. +61: [2023-04-29 10:58:55,854] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 488 +16: [2023-04-29 10:58:55,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +45: [2023-04-29 10:58:55,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:55,856] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 364 +10: [2023-04-29 10:58:55,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:55,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt. +60: [2023-04-29 10:58:55,857] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 484 + 4: [2023-04-29 10:58:55,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:55,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 10:58:55,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 10:58:55,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 10:58:55,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 10:58:55,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +13: [2023-04-29 10:58:55,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +35: [2023-04-29 10:58:55,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +35: [2023-04-29 10:58:55,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:55,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 10:58:55,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:55,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:55,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 10:58:55,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 10:58:55,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 10:58:55,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt. +46: [2023-04-29 10:58:55,874] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 370 + 4: [2023-04-29 10:58:55,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +42: [2023-04-29 10:58:55,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +13: [2023-04-29 10:58:55,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 10:58:55,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 10:58:55,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:55,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 10:58:55,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:55,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 10:58:55,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:55,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 7: [2023-04-29 10:58:55,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 10:58:55,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:55,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt. +60: [2023-04-29 10:58:55,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 10:58:55,886] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 378 +63: [2023-04-29 10:58:55,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 10:58:55,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 10:58:55,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +63: [2023-04-29 10:58:55,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 10:58:55,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 10:58:55,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:55,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 10:58:55,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +35: [2023-04-29 10:58:55,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 10:58:55,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 10:58:55,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt. +42: [2023-04-29 10:58:55,894] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 342 +63: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +63: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 10:58:55,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 10:58:55,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 10:58:55,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:55,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 10:58:55,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 10:58:55,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:55,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +12: [2023-04-29 10:58:55,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 10:58:55,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt. +43: [2023-04-29 10:58:55,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 348 +36: [2023-04-29 10:58:55,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 10:58:55,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 10:58:55,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt. +62: [2023-04-29 10:58:55,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +62: [2023-04-29 10:58:55,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +62: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +26: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 10:58:55,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:55,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +12: [2023-04-29 10:58:55,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 10:58:55,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 10:58:55,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 10:58:55,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 10:58:55,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 10:58:55,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... +12: [2023-04-29 10:58:55,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:55,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:55,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 10:58:55,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 10:58:55,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 10:58:55,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 10:58:55,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 10:58:55,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 7: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:55,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 10:58:55,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt. + 6: [2023-04-29 10:58:55,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 10:58:55,917] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 486 + 6: [2023-04-29 10:58:55,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +60: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +54: [2023-04-29 10:58:55,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 10:58:55,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:55,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt. +54: [2023-04-29 10:58:55,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 10:58:55,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +44: [2023-04-29 10:58:55,920] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 354 + 2: [2023-04-29 10:58:55,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 10:58:55,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 2: [2023-04-29 10:58:55,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 10:58:55,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 10:58:55,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +57: [2023-04-29 10:58:55,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:55,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 460 + 2: [2023-04-29 10:58:55,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 10:58:55,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 10:58:55,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt. +29: [2023-04-29 10:58:55,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 10:58:55,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 260 + 4: [2023-04-29 10:58:55,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 10:58:55,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 0: [2023-04-29 10:58:55,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:55,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 10:58:55,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:55,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:55,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:55,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +42: [2023-04-29 10:58:55,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 10:58:55,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:55,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 10:58:55,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:55,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:55,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:55,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:55,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:55,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 10:58:55,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 10:58:55,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 10:58:55,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 10:58:55,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 10:58:55,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:55,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt. +47: [2023-04-29 10:58:55,954] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 376 +42: [2023-04-29 10:58:55,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 10:58:55,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:55,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt. +52: [2023-04-29 10:58:55,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 416 +30: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:55,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:55,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 10:58:55,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:55,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:55,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:55,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +34: [2023-04-29 10:58:55,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt. +34: [2023-04-29 10:58:55,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 276 +57: [2023-04-29 10:58:55,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:55,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 462 + 6: [2023-04-29 10:58:55,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 10:58:55,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 10:58:55,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 10:58:55,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 10:58:55,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +60: [2023-04-29 10:58:55,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 4: [2023-04-29 10:58:55,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 10:58:55,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:55,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +43: [2023-04-29 10:58:55,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt. +43: [2023-04-29 10:58:55,982] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 344 +53: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt. +26: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 10:58:55,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 10:58:55,984] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 292 + 4: [2023-04-29 10:58:55,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 10:58:55,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt. +55: [2023-04-29 10:58:55,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:55,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 272 +26: [2023-04-29 10:58:55,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 10:58:55,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:55,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:55,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:55,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 10:58:55,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 10:58:55,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 10:58:55,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +41: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +41: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +41: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt. +55: [2023-04-29 10:58:55,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:55,993] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 266 +43: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 10:58:55,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 10:58:55,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:55,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 10:58:55,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 6: [2023-04-29 10:58:55,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 10:58:55,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 10:58:56,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 10:58:56,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:56,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:56,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +61: [2023-04-29 10:58:56,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +61: [2023-04-29 10:58:56,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +61: [2023-04-29 10:58:56,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +31: [2023-04-29 10:58:56,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 10:58:56,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +53: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +31: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 10:58:56,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 10:58:56,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:56,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +56: [2023-04-29 10:58:56,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt. +56: [2023-04-29 10:58:56,010] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 454 +53: [2023-04-29 10:58:56,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:56,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 10:58:56,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 10:58:56,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 10:58:56,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:56,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:56,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +62: [2023-04-29 10:58:56,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 10:58:56,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 10:58:56,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 10:58:56,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:56,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 10:58:56,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 10:58:56,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:56,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 10:58:56,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:56,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +43: [2023-04-29 10:58:56,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 10:58:56,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +43: [2023-04-29 10:58:56,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:56,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 10:58:56,028] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 380 + 6: [2023-04-29 10:58:56,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 10:58:56,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:56,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:56,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:56,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 10:58:56,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 10:58:56,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:56,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:56,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:56,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 10:58:56,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 10:58:56,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt. +42: [2023-04-29 10:58:56,042] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 340 + 6: [2023-04-29 10:58:56,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 10:58:56,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 10:58:56,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 10:58:56,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:56,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt. +33: [2023-04-29 10:58:56,044] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 268 +32: [2023-04-29 10:58:56,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:56,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 10:58:56,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +52: [2023-04-29 10:58:56,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +52: [2023-04-29 10:58:56,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +52: [2023-04-29 10:58:56,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +52: [2023-04-29 10:58:56,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:56,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:56,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:56,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 10:58:56,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 10:58:56,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 10:58:56,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 10:58:56,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 10:58:56,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 10:58:56,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 10:58:56,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 10:58:56,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 10:58:56,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:56,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:56,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:56,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 10:58:56,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 10:58:56,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 10:58:56,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 10:58:56,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +40: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +57: [2023-04-29 10:58:56,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +30: [2023-04-29 10:58:56,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +55: [2023-04-29 10:58:56,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:56,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 10:58:56,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 10:58:56,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +30: [2023-04-29 10:58:56,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +40: [2023-04-29 10:58:56,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:56,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 10:58:56,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 10:58:56,064] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 320 +51: [2023-04-29 10:58:56,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 10:58:56,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +30: [2023-04-29 10:58:56,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +51: [2023-04-29 10:58:56,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 10:58:56,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:56,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:56,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 10:58:56,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 10:58:56,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +55: [2023-04-29 10:58:56,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +55: [2023-04-29 10:58:56,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +34: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 10:58:56,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 10:58:56,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:56,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 10:58:56,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:56,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 10:58:56,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 10:58:56,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 10:58:56,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 10:58:56,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 10:58:56,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:56,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +52: [2023-04-29 10:58:56,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +52: [2023-04-29 10:58:56,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 10:58:56,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:56,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:56,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 10:58:56,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:56,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +53: [2023-04-29 10:58:56,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:56,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:56,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:56,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:56,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:56,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:56,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:56,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 10:58:56,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 10:58:56,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 10:58:56,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:56,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:56,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +53: [2023-04-29 10:58:56,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 10:58:56,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +41: [2023-04-29 10:58:56,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +41: [2023-04-29 10:58:56,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 10:58:56,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +11: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt. +62: [2023-04-29 10:58:56,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 500 + 0: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 10:58:56,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 10:58:56,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 10:58:56,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt. + 0: [2023-04-29 10:58:56,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +53: [2023-04-29 10:58:56,091] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 426 +43: [2023-04-29 10:58:56,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 0: [2023-04-29 10:58:56,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +62: [2023-04-29 10:58:56,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt. +62: [2023-04-29 10:58:56,091] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 498 +41: [2023-04-29 10:58:56,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 10:58:56,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 10:58:56,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 10:58:56,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:56,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 10:58:56,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 10:58:56,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:56,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:56,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 10:58:56,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 10:58:56,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 10:58:56,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:56,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 10:58:56,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 10:58:56,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:56,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:56,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 10:58:56,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:56,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:56,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:56,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 10:58:56,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 10:58:56,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:56,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:56,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:56,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:56,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 10:58:56,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 10:58:56,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 10:58:56,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt. +61: [2023-04-29 10:58:56,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 10:58:56,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:56,103] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 398 +61: [2023-04-29 10:58:56,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +15: [2023-04-29 10:58:56,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 10:58:56,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 10:58:56,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 10:58:56,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +33: [2023-04-29 10:58:56,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 10:58:56,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:56,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:56,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 10:58:56,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 10:58:56,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +43: [2023-04-29 10:58:56,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 10:58:56,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 10:58:56,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +32: [2023-04-29 10:58:56,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +45: [2023-04-29 10:58:56,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 10:58:56,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +45: [2023-04-29 10:58:56,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +45: [2023-04-29 10:58:56,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:56,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 10:58:56,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 10:58:56,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 10:58:56,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +17: [2023-04-29 10:58:56,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 10:58:56,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 10:58:56,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 10:58:56,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 10:58:56,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 10:58:56,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +45: [2023-04-29 10:58:56,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +32: [2023-04-29 10:58:56,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:56,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 10:58:56,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +24: [2023-04-29 10:58:56,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +24: [2023-04-29 10:58:56,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 10:58:56,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 10:58:56,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +57: [2023-04-29 10:58:56,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 10:58:56,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +32: [2023-04-29 10:58:56,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 10:58:56,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 10:58:56,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 10:58:56,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 10:58:56,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 10:58:56,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt. +50: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +50: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +50: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +15: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 10:58:56,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +22: [2023-04-29 10:58:56,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 10:58:56,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 10:58:56,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +32: [2023-04-29 10:58:56,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +22: [2023-04-29 10:58:56,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 10:58:56,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 10:58:56,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:56,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:56,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:56,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +15: [2023-04-29 10:58:56,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 10:58:56,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +17: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +39: [2023-04-29 10:58:56,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:56,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:56,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:56,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:56,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 10:58:56,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 10:58:56,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 10:58:56,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 10:58:56,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:56,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 10:58:56,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 10:58:56,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 10:58:56,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +44: [2023-04-29 10:58:56,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 10:58:56,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 10:58:56,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +10: [2023-04-29 10:58:56,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 10:58:56,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 10:58:56,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 10:58:56,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +24: [2023-04-29 10:58:56,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:56,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 10:58:56,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 10:58:56,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 10:58:56,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 10:58:56,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 10:58:56,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:56,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 10:58:56,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:56,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 10:58:56,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +33: [2023-04-29 10:58:56,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:56,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 10:58:56,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 10:58:56,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 10:58:56,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:56,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 10:58:56,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 10:58:56,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 10:58:56,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 10:58:56,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 10:58:56,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:56,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 10:58:56,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 10:58:56,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +10: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +49: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +49: [2023-04-29 10:58:56,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:56,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +22: [2023-04-29 10:58:56,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 10:58:56,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 10:58:56,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +52: [2023-04-29 10:58:56,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 10:58:56,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +10: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +10: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +22: [2023-04-29 10:58:56,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 10:58:56,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +33: [2023-04-29 10:58:56,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 10:58:56,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 10:58:56,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 10:58:56,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 10:58:56,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:56,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 10:58:56,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 10:58:56,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 10:58:56,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 10:58:56,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:56,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 10:58:56,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 10:58:56,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:56,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 10:58:56,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 10:58:56,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 10:58:56,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 10:58:56,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 10:58:56,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 10:58:56,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +33: [2023-04-29 10:58:56,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 0: [2023-04-29 10:58:56,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 10:58:56,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 10:58:56,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 10:58:56,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 10:58:56,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 10:58:56,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 10:58:56,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 10:58:56,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 10:58:56,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 10:58:56,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +48: [2023-04-29 10:58:56,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +48: [2023-04-29 10:58:56,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 10:58:56,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:56,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:56,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +34: [2023-04-29 10:58:56,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +48: [2023-04-29 10:58:56,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 10:58:56,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 10:58:56,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 10:58:56,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 10:58:56,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 10:58:56,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 10:58:56,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +47: [2023-04-29 10:58:56,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 10:58:56,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 10:58:56,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 10:58:56,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 10:58:56,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 0: [2023-04-29 10:58:56,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 0: [2023-04-29 10:58:56,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 0: [2023-04-29 10:58:56,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +58: [2023-04-29 10:58:56,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:56,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:56,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:56,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:56,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 10:58:56,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +39: [2023-04-29 10:58:56,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:56,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:56,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 10:58:56,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:56,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 10:58:56,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:56,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:56,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 10:58:56,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 10:58:56,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +39: [2023-04-29 10:58:56,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +48: [2023-04-29 10:58:56,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 10:58:56,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +50: [2023-04-29 10:58:56,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 10:58:56,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 10:58:56,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:56,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 10:58:56,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt. +58: [2023-04-29 10:58:56,223] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 464 +12: [2023-04-29 10:58:56,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 10:58:56,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 10:58:56,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 10:58:56,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... +50: [2023-04-29 10:58:56,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:56,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 10:58:56,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt. +12: [2023-04-29 10:58:56,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 10:58:56,227] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 474 +50: [2023-04-29 10:58:56,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 10:58:56,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 10:58:56,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 10:58:56,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:56,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +59: [2023-04-29 10:58:56,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt. +59: [2023-04-29 10:58:56,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 476 +50: [2023-04-29 10:58:56,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +56: [2023-04-29 10:58:56,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 10:58:56,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +56: [2023-04-29 10:58:56,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 10:58:56,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt. +50: [2023-04-29 10:58:56,254] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 402 + 4: [2023-04-29 10:58:56,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +32: [2023-04-29 10:58:56,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt. +32: [2023-04-29 10:58:56,255] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 258 +56: [2023-04-29 10:58:56,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:56,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 10:58:56,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +51: [2023-04-29 10:58:56,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt. +51: [2023-04-29 10:58:56,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 414 +56: [2023-04-29 10:58:56,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +56: [2023-04-29 10:58:56,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:56,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +56: [2023-04-29 10:58:56,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 10:58:56,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:56,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +58: [2023-04-29 10:58:56,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:56,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:56,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt. +48: [2023-04-29 10:58:56,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 10:58:56,272] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 472 +58: [2023-04-29 10:58:56,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +37: [2023-04-29 10:58:56,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 10:58:56,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 10:58:56,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 10:58:56,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +37: [2023-04-29 10:58:56,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +48: [2023-04-29 10:58:56,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +37: [2023-04-29 10:58:56,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 10:58:56,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 10:58:56,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 10:58:56,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +48: [2023-04-29 10:58:56,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:56,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 10:58:56,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +37: [2023-04-29 10:58:56,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:56,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:56,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:56,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:56,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 10:58:56,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 10:58:56,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 10:58:56,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 10:58:56,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +37: [2023-04-29 10:58:56,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:56,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 10:58:56,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:56,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 10:58:56,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:56,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 10:58:56,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 10:58:56,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:56,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:56,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:56,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:56,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:56,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:56,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:56,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 10:58:56,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt... + 5: [2023-04-29 10:58:56,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +18: [2023-04-29 10:58:56,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +18: [2023-04-29 10:58:56,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +18: [2023-04-29 10:58:56,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +41: [2023-04-29 10:58:56,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt. +41: [2023-04-29 10:58:56,324] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 332 +23: [2023-04-29 10:58:56,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +23: [2023-04-29 10:58:56,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +23: [2023-04-29 10:58:56,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +23: [2023-04-29 10:58:56,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +51: [2023-04-29 10:58:56,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt. +51: [2023-04-29 10:58:56,327] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 408 +60: [2023-04-29 10:58:56,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt. +60: [2023-04-29 10:58:56,343] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 482 +25: [2023-04-29 10:58:56,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +25: [2023-04-29 10:58:56,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +25: [2023-04-29 10:58:56,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +25: [2023-04-29 10:58:56,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +40: [2023-04-29 10:58:56,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt. +40: [2023-04-29 10:58:56,346] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 326 +18: [2023-04-29 10:58:56,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 10:58:56,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 10:58:56,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 10:58:56,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +18: [2023-04-29 10:58:56,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 10:58:56,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt. +54: [2023-04-29 10:58:56,351] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 436 +18: [2023-04-29 10:58:56,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 10:58:56,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt. +61: [2023-04-29 10:58:56,353] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 492 +23: [2023-04-29 10:58:56,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 10:58:56,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt. +63: [2023-04-29 10:58:56,366] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 506 +24: [2023-04-29 10:58:56,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 10:58:56,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 10:58:56,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt. +48: [2023-04-29 10:58:56,388] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 388 +11: [2023-04-29 10:58:56,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 10:58:56,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt. +40: [2023-04-29 10:58:56,394] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 324 +61: [2023-04-29 10:58:56,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt. +61: [2023-04-29 10:58:56,395] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 490 +63: [2023-04-29 10:58:56,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt. +63: [2023-04-29 10:58:56,397] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 508 +25: [2023-04-29 10:58:56,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:56,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +12: [2023-04-29 10:58:56,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +12: [2023-04-29 10:58:56,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +12: [2023-04-29 10:58:56,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt. +13: [2023-04-29 10:58:56,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +13: [2023-04-29 10:58:56,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +13: [2023-04-29 10:58:56,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +13: [2023-04-29 10:58:56,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +41: [2023-04-29 10:58:56,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt. +41: [2023-04-29 10:58:56,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 330 +47: [2023-04-29 10:58:56,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt. +47: [2023-04-29 10:58:56,433] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 382 +24: [2023-04-29 10:58:56,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:56,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:56,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 10:58:56,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 10:58:56,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt. +52: [2023-04-29 10:58:56,442] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 420 +13: [2023-04-29 10:58:56,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 10:58:56,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:56,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:56,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 10:58:56,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 10:58:56,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt. +63: [2023-04-29 10:58:56,455] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 504 +49: [2023-04-29 10:58:56,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt. +49: [2023-04-29 10:58:56,456] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 396 +25: [2023-04-29 10:58:56,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 10:58:56,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt. +31: [2023-04-29 10:58:56,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 10:58:56,462] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 300 +31: [2023-04-29 10:58:56,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 10:58:56,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 10:58:56,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 10:58:56,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:56,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +19: [2023-04-29 10:58:56,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 10:58:56,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 10:58:56,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:56,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 10:58:56,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 10:58:56,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 10:58:56,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 10:58:56,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 10:58:56,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:56,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 10:58:56,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt. +53: [2023-04-29 10:58:56,476] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 430 + 3: [2023-04-29 10:58:56,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:56,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:56,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:56,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:56,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +50: [2023-04-29 10:58:56,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt. +50: [2023-04-29 10:58:56,508] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 406 +20: [2023-04-29 10:58:56,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 10:58:56,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 10:58:56,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 10:58:56,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 10:58:56,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:56,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +50: [2023-04-29 10:58:56,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt. +50: [2023-04-29 10:58:56,512] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 404 + 2: [2023-04-29 10:58:56,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 10:58:56,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +12: [2023-04-29 10:58:56,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 10:58:56,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:56,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 3: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 3: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 10:58:56,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 10:58:56,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 10:58:56,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 10:58:56,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 10:58:56,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:56,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:56,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:56,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:56,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:56,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:56,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:56,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:56,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:56,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 10:58:56,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 10:58:56,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 10:58:56,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:56,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +63: [2023-04-29 10:58:56,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +63: [2023-04-29 10:58:56,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +63: [2023-04-29 10:58:56,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +22: [2023-04-29 10:58:56,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 10:58:56,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:56,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:56,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:56,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 10:58:56,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 10:58:56,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 10:58:56,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 10:58:56,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 10:58:56,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 10:58:56,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 7: [2023-04-29 10:58:56,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 7: [2023-04-29 10:58:56,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 7: [2023-04-29 10:58:56,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +30: [2023-04-29 10:58:56,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:56,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 10:58:56,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 10:58:56,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 10:58:56,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:56,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:56,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:56,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:56,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 10:58:56,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt. + 0: [2023-04-29 10:58:56,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 10:58:56,603] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 270 + 0: [2023-04-29 10:58:56,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:56,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:56,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:56,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:56,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:56,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 10:58:56,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:56,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:56,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +28: [2023-04-29 10:58:56,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +28: [2023-04-29 10:58:56,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +28: [2023-04-29 10:58:56,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 10:58:56,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 10:58:56,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt. +32: [2023-04-29 10:58:56,619] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 262 + 5: [2023-04-29 10:58:56,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:56,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 10:58:56,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt. + 1: [2023-04-29 10:58:56,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 10:58:56,623] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 438 +15: [2023-04-29 10:58:56,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +15: [2023-04-29 10:58:56,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 10:58:56,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:56,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +23: [2023-04-29 10:58:56,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:56,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 10:58:56,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 10:58:56,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +10: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:56,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:56,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:56,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 10:58:56,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +23: [2023-04-29 10:58:56,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 10:58:56,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +23: [2023-04-29 10:58:56,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:56,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:56,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 10:58:56,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:56,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt. + 3: [2023-04-29 10:58:56,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 10:58:56,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +36: [2023-04-29 10:58:56,643] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 288 +63: [2023-04-29 10:58:56,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +28: [2023-04-29 10:58:56,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:56,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 10:58:56,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:56,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:56,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:56,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:56,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +26: [2023-04-29 10:58:56,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +63: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +12: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt. +26: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 10:58:56,651] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 372 + 9: [2023-04-29 10:58:56,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:56,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 10:58:56,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:56,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:56,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 10:58:56,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt. +46: [2023-04-29 10:58:56,655] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 374 +12: [2023-04-29 10:58:56,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:56,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +22: [2023-04-29 10:58:56,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 10:58:56,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 10:58:56,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt. +35: [2023-04-29 10:58:56,664] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 282 +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:56,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:56,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +18: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:56,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 10:58:56,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 10:58:56,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +58: [2023-04-29 10:58:56,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt. +58: [2023-04-29 10:58:56,677] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 466 +26: [2023-04-29 10:58:56,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 10:58:56,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:56,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:56,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 10:58:56,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +35: [2023-04-29 10:58:56,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +35: [2023-04-29 10:58:56,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +35: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +57: [2023-04-29 10:58:56,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:56,685] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 456 +26: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt. + 7: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +14: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 10:58:56,686] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 322 +26: [2023-04-29 10:58:56,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:56,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:56,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:56,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 10:58:56,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 10:58:56,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 10:58:56,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:56,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:56,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 10:58:56,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 10:58:56,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 10:58:56,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 10:58:56,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 10:58:56,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 10:58:56,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +21: [2023-04-29 10:58:56,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:56,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:56,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +57: [2023-04-29 10:58:56,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt. +57: [2023-04-29 10:58:56,704] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 458 +35: [2023-04-29 10:58:56,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 10:58:56,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +53: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 1: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +53: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +28: [2023-04-29 10:58:56,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 10:58:56,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:56,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:56,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 10:58:56,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:56,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 10:58:56,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 10:58:56,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 10:58:56,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:56,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 10:58:56,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:56,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 10:58:56,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt. +20: [2023-04-29 10:58:56,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 10:58:56,715] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 428 +16: [2023-04-29 10:58:56,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:56,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:56,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:56,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:56,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:56,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:56,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +32: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +32: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +28: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +16: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 10:58:56,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +43: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +43: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +28: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +43: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +12: [2023-04-29 10:58:56,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:56,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 10:58:56,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:56,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 10:58:56,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:56,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 10:58:56,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 10:58:56,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 7: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 10:58:56,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:56,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +12: [2023-04-29 10:58:56,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:56,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 10:58:56,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:56,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 10:58:56,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 9: [2023-04-29 10:58:56,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 10:58:56,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 10:58:56,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:56,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 10:58:56,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 10:58:56,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 10:58:56,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 10:58:56,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 10:58:56,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt. +39: [2023-04-29 10:58:56,736] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 314 +27: [2023-04-29 10:58:56,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:56,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 10:58:56,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 10:58:56,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 10:58:56,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +58: [2023-04-29 10:58:56,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt. +58: [2023-04-29 10:58:56,743] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 468 +26: [2023-04-29 10:58:56,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:56,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:56,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 10:58:56,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +43: [2023-04-29 10:58:56,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 10:58:56,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 10:58:56,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:56,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:56,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 10:58:56,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 10:58:56,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:56,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 10:58:56,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 10:58:56,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:56,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 10:58:56,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +61: [2023-04-29 10:58:56,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 6: [2023-04-29 10:58:56,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 10:58:56,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +61: [2023-04-29 10:58:56,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 10:58:56,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 10:58:56,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:56,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:56,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 10:58:56,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 10:58:56,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +42: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +42: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 10:58:56,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:56,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 10:58:56,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 10:58:56,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 10:58:56,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 10:58:56,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +18: [2023-04-29 10:58:56,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 10:58:56,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:56,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt. +27: [2023-04-29 10:58:56,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:56,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 290 +26: [2023-04-29 10:58:56,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +18: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 10:58:56,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:56,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 10:58:56,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:56,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 10:58:56,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 10:58:56,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 10:58:56,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:56,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 10:58:56,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 10:58:56,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 10:58:56,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt. +48: [2023-04-29 10:58:56,775] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 384 +28: [2023-04-29 10:58:56,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 10:58:56,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +39: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 10:58:56,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:56,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 10:58:56,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt. +59: [2023-04-29 10:58:56,782] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 478 +61: [2023-04-29 10:58:56,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:56,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:56,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 10:58:56,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:56,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:56,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 6: [2023-04-29 10:58:56,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:56,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:56,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 10:58:56,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt. +62: [2023-04-29 10:58:56,786] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 502 +35: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +36: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 10:58:56,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 10:58:56,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +16: [2023-04-29 10:58:56,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:56,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:56,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 6: [2023-04-29 10:58:56,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 10:58:56,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 10:58:56,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +26: [2023-04-29 10:58:56,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 10:58:56,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:56,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 10:58:56,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 10:58:56,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 10:58:56,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 10:58:56,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +16: [2023-04-29 10:58:56,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +36: [2023-04-29 10:58:56,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 10:58:56,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 10:58:56,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:56,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 10:58:56,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 10:58:56,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:56,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 10:58:56,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 10:58:56,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:56,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt. +56: [2023-04-29 10:58:56,801] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 452 +20: [2023-04-29 10:58:56,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 10:58:56,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +36: [2023-04-29 10:58:56,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 10:58:56,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 10:58:56,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 10:58:56,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +39: [2023-04-29 10:58:56,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:56,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 10:58:56,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:56,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +20: [2023-04-29 10:58:56,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 10:58:56,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 10:58:56,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 10:58:56,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 10:58:56,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 10:58:56,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 10:58:56,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +20: [2023-04-29 10:58:56,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 10:58:56,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +51: [2023-04-29 10:58:56,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +51: [2023-04-29 10:58:56,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 10:58:56,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:56,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +51: [2023-04-29 10:58:56,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +28: [2023-04-29 10:58:56,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 10:58:56,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 10:58:56,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 10:58:56,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 10:58:56,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 10:58:56,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:56,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:56,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:56,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +33: [2023-04-29 10:58:56,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +33: [2023-04-29 10:58:56,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +33: [2023-04-29 10:58:56,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 10:58:56,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 10:58:56,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +45: [2023-04-29 10:58:56,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 10:58:56,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 10:58:56,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 10:58:56,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 10:58:56,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:56,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 10:58:56,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:56,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:56,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 10:58:56,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 10:58:56,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:56,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 10:58:56,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt. +51: [2023-04-29 10:58:56,823] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 412 +54: [2023-04-29 10:58:56,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 10:58:56,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:56,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:56,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +60: [2023-04-29 10:58:56,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 10:58:56,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 10:58:56,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +54: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 10:58:56,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:56,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:56,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +32: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 10:58:56,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 10:58:56,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +55: [2023-04-29 10:58:56,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:56,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 10:58:56,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 4: [2023-04-29 10:58:56,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 10:58:56,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 10:58:56,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:56,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +60: [2023-04-29 10:58:56,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 10:58:56,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:56,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +60: [2023-04-29 10:58:56,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +60: [2023-04-29 10:58:56,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +61: [2023-04-29 10:58:56,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 10:58:56,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +33: [2023-04-29 10:58:56,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:56,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:56,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:56,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 10:58:56,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:56,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +55: [2023-04-29 10:58:56,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:56,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:56,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:56,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:56,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 10:58:56,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:56,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 10:58:56,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 10:58:56,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 10:58:56,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 10:58:56,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt. +55: [2023-04-29 10:58:56,852] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 442 +45: [2023-04-29 10:58:56,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:56,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 10:58:56,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +55: [2023-04-29 10:58:56,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +61: [2023-04-29 10:58:56,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +61: [2023-04-29 10:58:56,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +61: [2023-04-29 10:58:56,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +39: [2023-04-29 10:58:56,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 10:58:56,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 10:58:56,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 10:58:56,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 10:58:56,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 10:58:56,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +39: [2023-04-29 10:58:56,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +58: [2023-04-29 10:58:56,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 10:58:56,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 10:58:56,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 10:58:56,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 10:58:56,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +39: [2023-04-29 10:58:56,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:56,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 10:58:56,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +21: [2023-04-29 10:58:56,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 10:58:56,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 10:58:56,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 10:58:56,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +39: [2023-04-29 10:58:56,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 10:58:56,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 10:58:56,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 10:58:56,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:56,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 10:58:56,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 10:58:56,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 10:58:56,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 10:58:56,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 10:58:56,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 10:58:56,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 10:58:56,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 10:58:56,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 10:58:56,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +38: [2023-04-29 10:58:56,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 10:58:56,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +62: [2023-04-29 10:58:56,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 10:58:56,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +34: [2023-04-29 10:58:56,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 10:58:56,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 10:58:56,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 10:58:56,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 10:58:56,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +33: [2023-04-29 10:58:56,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:56,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +48: [2023-04-29 10:58:56,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 10:58:56,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +48: [2023-04-29 10:58:56,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 10:58:56,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +48: [2023-04-29 10:58:56,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 10:58:56,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 10:58:56,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 10:58:56,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:56,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +58: [2023-04-29 10:58:56,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:56,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 10:58:56,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 10:58:56,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 10:58:56,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +14: [2023-04-29 10:58:56,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 10:58:56,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +14: [2023-04-29 10:58:56,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 10:58:56,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 10:58:56,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt. +60: [2023-04-29 10:58:56,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 480 +21: [2023-04-29 10:58:56,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +51: [2023-04-29 10:58:56,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +21: [2023-04-29 10:58:56,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 10:58:56,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 10:58:56,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:56,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 10:58:56,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 10:58:56,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 10:58:56,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 10:58:56,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:56,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 10:58:56,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 10:58:56,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:56,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:56,915] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 432 +51: [2023-04-29 10:58:56,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 10:58:56,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 10:58:56,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 10:58:56,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 10:58:56,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 10:58:56,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:56,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 10:58:56,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:56,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 10:58:56,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 10:58:56,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:56,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +45: [2023-04-29 10:58:56,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 10:58:56,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:56,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:56,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 10:58:56,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:56,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +62: [2023-04-29 10:58:56,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:56,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:56,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:56,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:56,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt. +38: [2023-04-29 10:58:56,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 10:58:56,925] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 336 +34: [2023-04-29 10:58:56,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:56,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 10:58:56,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +38: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +33: [2023-04-29 10:58:56,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +34: [2023-04-29 10:58:56,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 10:58:56,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +45: [2023-04-29 10:58:56,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 10:58:56,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:56,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 10:58:56,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:56,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:56,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:56,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 10:58:56,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:56,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:56,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 10:58:56,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:56,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:56,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 10:58:56,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:56,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:56,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:56,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 10:58:56,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt. +48: [2023-04-29 10:58:56,940] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 390 +57: [2023-04-29 10:58:56,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 10:58:56,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:56,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 10:58:56,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:56,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:56,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:56,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 10:58:56,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:56,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 10:58:56,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 10:58:56,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 10:58:56,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 10:58:56,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +57: [2023-04-29 10:58:56,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 10:58:56,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 10:58:56,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 10:58:56,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 10:58:56,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 10:58:56,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 10:58:56,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +37: [2023-04-29 10:58:56,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +24: [2023-04-29 10:58:56,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 10:58:56,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:56,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 10:58:56,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 10:58:56,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 10:58:56,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +58: [2023-04-29 10:58:56,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:56,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +11: [2023-04-29 10:58:56,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:56,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:56,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:56,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 10:58:56,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:56,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 10:58:56,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 10:58:56,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:56,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 10:58:56,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:56,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 10:58:56,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 10:58:56,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 10:58:56,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 10:58:56,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 10:58:56,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +46: [2023-04-29 10:58:56,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +58: [2023-04-29 10:58:56,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 10:58:56,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 10:58:56,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +38: [2023-04-29 10:58:56,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 10:58:56,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 10:58:56,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 10:58:56,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +14: [2023-04-29 10:58:56,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +49: [2023-04-29 10:58:56,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:56,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 10:58:56,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +48: [2023-04-29 10:58:56,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:56,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 10:58:56,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +46: [2023-04-29 10:58:56,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:56,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +25: [2023-04-29 10:58:56,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 10:58:56,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +38: [2023-04-29 10:58:56,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 10:58:56,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +46: [2023-04-29 10:58:56,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 10:58:56,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 10:58:56,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 10:58:56,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 10:58:56,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +62: [2023-04-29 10:58:56,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:56,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 10:58:56,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +21: [2023-04-29 10:58:56,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +34: [2023-04-29 10:58:56,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:56,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +62: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +46: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 10:58:56,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 10:58:56,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +25: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:56,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +62: [2023-04-29 10:58:56,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 10:58:56,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:56,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:56,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +31: [2023-04-29 10:58:56,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 10:58:56,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 10:58:56,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. + 2: [2023-04-29 10:58:56,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +34: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +31: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +62: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:56,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:56,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:56,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:56,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:56,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +25: [2023-04-29 10:58:56,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:56,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +62: [2023-04-29 10:58:57,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:57,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:57,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 10:58:57,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 10:58:57,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 10:58:57,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:57,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 10:58:57,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 10:58:57,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 10:58:57,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 10:58:57,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:57,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 10:58:57,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 10:58:57,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +38: [2023-04-29 10:58:57,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +62: [2023-04-29 10:58:57,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 10:58:57,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 10:58:57,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 10:58:57,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 10:58:57,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:57,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +31: [2023-04-29 10:58:57,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 10:58:57,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:57,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 10:58:57,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 10:58:57,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 10:58:57,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 10:58:57,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 10:58:57,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +34: [2023-04-29 10:58:57,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:57,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:57,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 10:58:57,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 10:58:57,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 10:58:57,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:57,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 10:58:57,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:57,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:57,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 10:58:57,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 10:58:57,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 10:58:57,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +34: [2023-04-29 10:58:57,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 10:58:57,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 10:58:57,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 10:58:57,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 10:58:57,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 10:58:57,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 10:58:57,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 10:58:57,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt. +56: [2023-04-29 10:58:57,023] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 448 +57: [2023-04-29 10:58:57,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 10:58:57,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 10:58:57,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 10:58:57,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +25: [2023-04-29 10:58:57,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 10:58:57,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt. +51: [2023-04-29 10:58:57,030] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 410 +31: [2023-04-29 10:58:57,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 10:58:57,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 10:58:57,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 10:58:57,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 10:58:57,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:57,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +11: [2023-04-29 10:58:57,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 10:58:57,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt. +49: [2023-04-29 10:58:57,041] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 394 +17: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:57,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +62: [2023-04-29 10:58:57,055] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 498 +25: [2023-04-29 10:58:57,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:57,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 10:58:57,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +25: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 10:58:57,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:57,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:57,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:57,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:57,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +62: [2023-04-29 10:58:57,077] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 502 +62: [2023-04-29 10:58:57,078] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 500 + 5: [2023-04-29 10:58:57,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,083] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 344 +17: [2023-04-29 10:58:57,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 10:58:57,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 10:58:57,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 10:58:57,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 10:58:57,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 10:58:57,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 10:58:57,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 10:58:57,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 10:58:57,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 10:58:57,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +24: [2023-04-29 10:58:57,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,096] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 348 +24: [2023-04-29 10:58:57,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +24: [2023-04-29 10:58:57,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 10:58:57,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:57,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 10:58:57,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:57,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:57,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +11: [2023-04-29 10:58:57,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 10:58:57,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 10:58:57,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 10:58:57,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +34: [2023-04-29 10:58:57,100] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 272 +31: [2023-04-29 10:58:57,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:57,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 3: [2023-04-29 10:58:57,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 10:58:57,105] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 276 +22: [2023-04-29 10:58:57,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 10:58:57,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 10:58:57,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 10:58:57,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:57,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +30: [2023-04-29 10:58:57,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +30: [2023-04-29 10:58:57,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +30: [2023-04-29 10:58:57,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +31: [2023-04-29 10:58:57,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 10:58:57,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:57,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 10:58:57,122] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 458 +57: [2023-04-29 10:58:57,122] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 462 +57: [2023-04-29 10:58:57,123] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 460 +11: [2023-04-29 10:58:57,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 10:58:57,125] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 456 +19: [2023-04-29 10:58:57,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:57,127] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 506 +11: [2023-04-29 10:58:57,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:57,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:57,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:57,133] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 504 + 2: [2023-04-29 10:58:57,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-04-29 10:58:57,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... + 2: [2023-04-29 10:58:57,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 2: [2023-04-29 10:58:57,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... +31: [2023-04-29 10:58:57,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:57,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... +11: [2023-04-29 10:58:57,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... +11: [2023-04-29 10:58:57,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... +11: [2023-04-29 10:58:57,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... +63: [2023-04-29 10:58:57,135] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 510 + 5: [2023-04-29 10:58:57,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 10:58:57,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 10:58:57,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 10:58:57,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 10:58:57,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 10:58:57,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 10:58:57,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +17: [2023-04-29 10:58:57,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +63: [2023-04-29 10:58:57,151] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 508 +25: [2023-04-29 10:58:57,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +25: [2023-04-29 10:58:57,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... + 5: [2023-04-29 10:58:57,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 10:58:57,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +25: [2023-04-29 10:58:57,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... + 1: [2023-04-29 10:58:57,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 10:58:57,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +27: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +27: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:57,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 10:58:57,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +13: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:57,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +13: [2023-04-29 10:58:57,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 10:58:57,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:57,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 7: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 10:58:57,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +62: [2023-04-29 10:58:57,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt. +62: [2023-04-29 10:58:57,168] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 496 + 0: [2023-04-29 10:58:57,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:57,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 10:58:57,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +31: [2023-04-29 10:58:57,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +31: [2023-04-29 10:58:57,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +31: [2023-04-29 10:58:57,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... + 4: [2023-04-29 10:58:57,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 10:58:57,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 10:58:57,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +62: [2023-04-29 10:58:57,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 496 +18: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 10:58:57,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 10:58:57,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 10:58:57,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt. + 1: [2023-04-29 10:58:57,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 10:58:57,179] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 298 +22: [2023-04-29 10:58:57,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 10:58:57,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 10:58:57,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 10:58:57,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt. +33: [2023-04-29 10:58:57,186] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 264 +51: [2023-04-29 10:58:57,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 408 +29: [2023-04-29 10:58:57,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 10:58:57,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 10:58:57,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 396 +22: [2023-04-29 10:58:57,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:57,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 6: [2023-04-29 10:58:57,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +49: [2023-04-29 10:58:57,188] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 394 + 6: [2023-04-29 10:58:57,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 10:58:57,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 10:58:57,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:57,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +13: [2023-04-29 10:58:57,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:57,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +47: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +29: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +47: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +19: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +47: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt. +29: [2023-04-29 10:58:57,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 10:58:57,196] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 392 +11: [2023-04-29 10:58:57,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:57,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +51: [2023-04-29 10:58:57,197] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 414 +29: [2023-04-29 10:58:57,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:57,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 10:58:57,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:57,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +51: [2023-04-29 10:58:57,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 412 +56: [2023-04-29 10:58:57,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 448 +11: [2023-04-29 10:58:57,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 10:58:57,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 10:58:57,204] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 410 +18: [2023-04-29 10:58:57,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 10:58:57,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +37: [2023-04-29 10:58:57,204] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 300 +11: [2023-04-29 10:58:57,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +37: [2023-04-29 10:58:57,205] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 298 +29: [2023-04-29 10:58:57,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 10:58:57,209] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 302 +27: [2023-04-29 10:58:57,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 10:58:57,210] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 450 + 0: [2023-04-29 10:58:57,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 10:58:57,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 10:58:57,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 454 +49: [2023-04-29 10:58:57,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 398 +27: [2023-04-29 10:58:57,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 10:58:57,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 10:58:57,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 10:58:57,219] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 452 +47: [2023-04-29 10:58:57,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +47: [2023-04-29 10:58:57,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:57,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt. +47: [2023-04-29 10:58:57,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 10:58:57,220] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 256 +47: [2023-04-29 10:58:57,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 10:58:57,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +17: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... +17: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... +17: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... +17: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... +20: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 10:58:57,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 10:58:57,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 10:58:57,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +10: [2023-04-29 10:58:57,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +10: [2023-04-29 10:58:57,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +10: [2023-04-29 10:58:57,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 10:58:57,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 10:58:57,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 3: [2023-04-29 10:58:57,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 3: [2023-04-29 10:58:57,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 10:58:57,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 10:58:57,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt. +37: [2023-04-29 10:58:57,237] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 296 + 1: [2023-04-29 10:58:57,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 10:58:57,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +19: [2023-04-29 10:58:57,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +19: [2023-04-29 10:58:57,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... +19: [2023-04-29 10:58:57,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... +37: [2023-04-29 10:58:57,244] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 296 + 1: [2023-04-29 10:58:57,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 10:58:57,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 5: [2023-04-29 10:58:57,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... + 1: [2023-04-29 10:58:57,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... + 5: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... + 9: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 10:58:57,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +24: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +24: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +24: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +20: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 10:58:57,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 10:58:57,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 10:58:57,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 10:58:57,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +10: [2023-04-29 10:58:57,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 10:58:57,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +20: [2023-04-29 10:58:57,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +10: [2023-04-29 10:58:57,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 10:58:57,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +27: [2023-04-29 10:58:57,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 10:58:57,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +54: [2023-04-29 10:58:57,266] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 432 + 1: [2023-04-29 10:58:57,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 1: [2023-04-29 10:58:57,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +27: [2023-04-29 10:58:57,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:57,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 10:58:57,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 390 +36: [2023-04-29 10:58:57,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 10:58:57,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 10:58:57,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +27: [2023-04-29 10:58:57,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +36: [2023-04-29 10:58:57,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +27: [2023-04-29 10:58:57,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 1: [2023-04-29 10:58:57,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +47: [2023-04-29 10:58:57,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +30: [2023-04-29 10:58:57,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +30: [2023-04-29 10:58:57,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +23: [2023-04-29 10:58:57,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 10:58:57,278] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 384 +30: [2023-04-29 10:58:57,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 10:58:57,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +47: [2023-04-29 10:58:57,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +29: [2023-04-29 10:58:57,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +47: [2023-04-29 10:58:57,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 10:58:57,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt. +43: [2023-04-29 10:58:57,283] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 350 +23: [2023-04-29 10:58:57,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 10:58:57,284] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 388 +54: [2023-04-29 10:58:57,284] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 434 +39: [2023-04-29 10:58:57,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt. +33: [2023-04-29 10:58:57,284] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 266 +23: [2023-04-29 10:58:57,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +39: [2023-04-29 10:58:57,284] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 318 +23: [2023-04-29 10:58:57,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +23: [2023-04-29 10:58:57,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +23: [2023-04-29 10:58:57,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 10:58:57,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 10:58:57,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 10:58:57,286] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 438 +47: [2023-04-29 10:58:57,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +33: [2023-04-29 10:58:57,287] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 268 + 3: [2023-04-29 10:58:57,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +33: [2023-04-29 10:58:57,290] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 264 +43: [2023-04-29 10:58:57,291] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 350 +47: [2023-04-29 10:58:57,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +47: [2023-04-29 10:58:57,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt... +54: [2023-04-29 10:58:57,292] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 436 +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 10:58:57,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +33: [2023-04-29 10:58:57,299] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 270 +36: [2023-04-29 10:58:57,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +36: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +28: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +36: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 10:58:57,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +53: [2023-04-29 10:58:57,300] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 428 + 3: [2023-04-29 10:58:57,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +13: [2023-04-29 10:58:57,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:57,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +46: [2023-04-29 10:58:57,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt. +36: [2023-04-29 10:58:57,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +36: [2023-04-29 10:58:57,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 10:58:57,303] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 368 +53: [2023-04-29 10:58:57,304] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 426 +53: [2023-04-29 10:58:57,304] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 430 +63: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +13: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +59: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +59: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +13: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +59: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +63: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +59: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +13: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:57,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 10:58:57,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:57,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +30: [2023-04-29 10:58:57,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 10:58:57,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +26: [2023-04-29 10:58:57,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +26: [2023-04-29 10:58:57,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +26: [2023-04-29 10:58:57,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 10:58:57,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 10:58:57,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:57,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 10:58:57,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 10:58:57,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 490 + 9: [2023-04-29 10:58:57,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 10:58:57,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +39: [2023-04-29 10:58:57,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt. +10: [2023-04-29 10:58:57,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 10:58:57,319] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 312 + 6: [2023-04-29 10:58:57,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 10:58:57,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 488 +14: [2023-04-29 10:58:57,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +14: [2023-04-29 10:58:57,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +14: [2023-04-29 10:58:57,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +14: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +32: [2023-04-29 10:58:57,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 262 +12: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +22: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +22: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +22: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +12: [2023-04-29 10:58:57,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 +10: [2023-04-29 10:58:57,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine +10: [2023-04-29 10:58:57,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... +16: [2023-04-29 10:58:57,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... +16: [2023-04-29 10:58:57,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... +16: [2023-04-29 10:58:57,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... +10: [2023-04-29 10:58:57,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 10:58:57,327] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 256 +10: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 1: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 1: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... + 1: [2023-04-29 10:58:57,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... +28: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 10:58:57,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:57,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +61: [2023-04-29 10:58:57,332] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 494 +63: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +61: [2023-04-29 10:58:57,332] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 492 +12: [2023-04-29 10:58:57,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:57,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:57,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:57,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt. +53: [2023-04-29 10:58:57,333] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 424 +63: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +63: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 10:58:57,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:57,335] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 282 +63: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +63: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 10:58:57,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 10:58:57,336] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 258 + 0: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 10:58:57,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 10:58:57,337] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 472 + 0: [2023-04-29 10:58:57,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 10:58:57,340] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 424 +59: [2023-04-29 10:58:57,342] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 478 +26: [2023-04-29 10:58:57,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:57,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:57,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:57,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 10:58:57,343] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 474 + 8: [2023-04-29 10:58:57,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 10:58:57,344] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 280 +59: [2023-04-29 10:58:57,345] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 476 + 0: [2023-04-29 10:58:57,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 10:58:57,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 286 +23: [2023-04-29 10:58:57,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 10:58:57,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 284 +28: [2023-04-29 10:58:57,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 10:58:57,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 10:58:57,350] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 260 + 2: [2023-04-29 10:58:57,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 2: [2023-04-29 10:58:57,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +41: [2023-04-29 10:58:57,353] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 334 +23: [2023-04-29 10:58:57,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 10:58:57,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 10:58:57,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:57,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +10: [2023-04-29 10:58:57,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 10:58:57,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 2: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +28: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +63: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +63: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +14: [2023-04-29 10:58:57,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 10:58:57,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +14: [2023-04-29 10:58:57,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:57,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 2: [2023-04-29 10:58:57,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +28: [2023-04-29 10:58:57,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 10:58:57,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 10:58:57,362] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 330 +41: [2023-04-29 10:58:57,362] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 328 +13: [2023-04-29 10:58:57,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 10:58:57,365] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 332 +16: [2023-04-29 10:58:57,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +21: [2023-04-29 10:58:57,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +21: [2023-04-29 10:58:57,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +21: [2023-04-29 10:58:57,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 10:58:57,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 10:58:57,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 10:58:57,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 10:58:57,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +30: [2023-04-29 10:58:57,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 10:58:57,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt... +30: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt... +36: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt... +26: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 10:58:57,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 10:58:57,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt... +30: [2023-04-29 10:58:57,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 10:58:57,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 10:58:57,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:57,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +30: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +29: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +29: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:57,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 10:58:57,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 10:58:57,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 10:58:57,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 10:58:57,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 10:58:57,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 10:58:57,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 10:58:57,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +12: [2023-04-29 10:58:57,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 10:58:57,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 10:58:57,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 3: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 3: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +27: [2023-04-29 10:58:57,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +27: [2023-04-29 10:58:57,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 2: [2023-04-29 10:58:57,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 10:58:57,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,392] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 446 +28: [2023-04-29 10:58:57,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 10:58:57,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,400] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 440 +55: [2023-04-29 10:58:57,402] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 442 +28: [2023-04-29 10:58:57,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +63: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt... +63: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt... +63: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt... +63: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt... +18: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,405] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 444 +18: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +32: [2023-04-29 10:58:57,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 10:58:57,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 9: [2023-04-29 10:58:57,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... + 9: [2023-04-29 10:58:57,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 9: [2023-04-29 10:58:57,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 9: [2023-04-29 10:58:57,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 8: [2023-04-29 10:58:57,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 10:58:57,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 10:58:57,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +26: [2023-04-29 10:58:57,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... + 0: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... +28: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +28: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 10:58:57,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt... +12: [2023-04-29 10:58:57,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 10:58:57,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt... +59: [2023-04-29 10:58:57,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt... +59: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt... +21: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:57,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 10:58:57,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 10:58:57,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 10:58:57,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 10:58:57,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 10:58:57,419] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 366 +15: [2023-04-29 10:58:57,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +12: [2023-04-29 10:58:57,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 10:58:57,421] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 362 +26: [2023-04-29 10:58:57,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 10:58:57,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 10:58:57,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 10:58:57,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 10:58:57,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 10:58:57,424] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 308 +41: [2023-04-29 10:58:57,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 10:58:57,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 10:58:57,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 10:58:57,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 10:58:57,426] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 360 +16: [2023-04-29 10:58:57,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 10:58:57,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 10:58:57,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 10:58:57,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 10:58:57,428] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 364 +35: [2023-04-29 10:58:57,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +28: [2023-04-29 10:58:57,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 10:58:57,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 10:58:57,431] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 324 +26: [2023-04-29 10:58:57,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +32: [2023-04-29 10:58:57,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 10:58:57,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 10:58:57,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 10:58:57,434] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 310 +23: [2023-04-29 10:58:57,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +23: [2023-04-29 10:58:57,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +23: [2023-04-29 10:58:57,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +23: [2023-04-29 10:58:57,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +32: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +53: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 10:58:57,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:57,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +53: [2023-04-29 10:58:57,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 10:58:57,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 10:58:57,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 10:58:57,439] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 306 +16: [2023-04-29 10:58:57,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 10:58:57,439] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 354 +32: [2023-04-29 10:58:57,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 10:58:57,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 10:58:57,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +16: [2023-04-29 10:58:57,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 10:58:57,442] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 304 +16: [2023-04-29 10:58:57,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +29: [2023-04-29 10:58:57,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +29: [2023-04-29 10:58:57,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 10:58:57,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 10:58:57,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 10:58:57,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 10:58:57,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 10:58:57,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 10:58:57,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 10:58:57,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +13: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... +13: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... +13: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +35: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:57,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:57,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:57,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:57,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:57,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 2: [2023-04-29 10:58:57,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +41: [2023-04-29 10:58:57,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 10:58:57,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 10:58:57,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 10:58:57,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 10:58:57,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:57,457] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 322 +41: [2023-04-29 10:58:57,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 10:58:57,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:57,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:57,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 10:58:57,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 10:58:57,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:57,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 10:58:57,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +54: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 10:58:57,462] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 336 +35: [2023-04-29 10:58:57,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:57,463] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 356 +42: [2023-04-29 10:58:57,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 10:58:57,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,464] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 320 +42: [2023-04-29 10:58:57,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 10:58:57,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 10:58:57,465] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 342 +53: [2023-04-29 10:58:57,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:57,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:57,467] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 326 +42: [2023-04-29 10:58:57,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 2: [2023-04-29 10:58:57,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 10:58:57,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +53: [2023-04-29 10:58:57,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,469] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 338 +42: [2023-04-29 10:58:57,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 2: [2023-04-29 10:58:57,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +53: [2023-04-29 10:58:57,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 10:58:57,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +14: [2023-04-29 10:58:57,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +53: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +53: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +53: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +14: [2023-04-29 10:58:57,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +53: [2023-04-29 10:58:57,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:57,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,472] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 340 +18: [2023-04-29 10:58:57,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 10:58:57,473] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 352 +44: [2023-04-29 10:58:57,473] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 358 +60: [2023-04-29 10:58:57,474] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 480 + 2: [2023-04-29 10:58:57,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 10:58:57,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +61: [2023-04-29 10:58:57,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +61: [2023-04-29 10:58:57,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +29: [2023-04-29 10:58:57,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 10:58:57,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 10:58:57,477] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 482 +18: [2023-04-29 10:58:57,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 6: [2023-04-29 10:58:57,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... +14: [2023-04-29 10:58:57,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +60: [2023-04-29 10:58:57,479] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 486 +14: [2023-04-29 10:58:57,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 10:58:57,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +43: [2023-04-29 10:58:57,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +43: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +12: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... +12: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... +12: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... +12: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... +21: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +14: [2023-04-29 10:58:57,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 10:58:57,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 10:58:57,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 10:58:57,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 10:58:57,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +41: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... +35: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 8: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... + 8: [2023-04-29 10:58:57,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... +60: [2023-04-29 10:58:57,485] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 484 +35: [2023-04-29 10:58:57,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +21: [2023-04-29 10:58:57,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 10:58:57,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 10:58:57,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +51: [2023-04-29 10:58:57,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +51: [2023-04-29 10:58:57,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +21: [2023-04-29 10:58:57,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +42: [2023-04-29 10:58:57,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 10:58:57,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 10:58:57,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 10:58:57,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 10:58:57,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 10:58:57,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 10:58:57,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 10:58:57,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 10:58:57,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 10:58:57,491] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 312 +51: [2023-04-29 10:58:57,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +21: [2023-04-29 10:58:57,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 10:58:57,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 10:58:57,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +46: [2023-04-29 10:58:57,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 10:58:57,496] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 316 +46: [2023-04-29 10:58:57,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +46: [2023-04-29 10:58:57,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,498] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 466 +60: [2023-04-29 10:58:57,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 10:58:57,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 10:58:57,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +15: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +12: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +53: [2023-04-29 10:58:57,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +53: [2023-04-29 10:58:57,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +53: [2023-04-29 10:58:57,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +61: [2023-04-29 10:58:57,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +61: [2023-04-29 10:58:57,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:57,502] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 318 +61: [2023-04-29 10:58:57,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:57,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +12: [2023-04-29 10:58:57,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 10:58:57,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 10:58:57,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 10:58:57,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 10:58:57,505] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 314 +58: [2023-04-29 10:58:57,505] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 468 + 4: [2023-04-29 10:58:57,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 10:58:57,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +52: [2023-04-29 10:58:57,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +52: [2023-04-29 10:58:57,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +52: [2023-04-29 10:58:57,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +61: [2023-04-29 10:58:57,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:57,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:57,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +61: [2023-04-29 10:58:57,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:57,508] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 464 +61: [2023-04-29 10:58:57,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 10:58:57,508] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 470 +43: [2023-04-29 10:58:57,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 10:58:57,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +43: [2023-04-29 10:58:57,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +43: [2023-04-29 10:58:57,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:57,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +43: [2023-04-29 10:58:57,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:57,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +48: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt. +43: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +28: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +28: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +28: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +43: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +48: [2023-04-29 10:58:57,513] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 386 +61: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +61: [2023-04-29 10:58:57,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +61: [2023-04-29 10:58:57,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +61: [2023-04-29 10:58:57,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 10:58:57,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +51: [2023-04-29 10:58:57,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:57,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:57,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:57,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:57,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 10:58:57,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:57,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 10:58:57,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 10:58:57,519] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 406 + 4: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +51: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +46: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:57,521] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 386 +46: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 10:58:57,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt... +51: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 10:58:57,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 10:58:57,522] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 400 +47: [2023-04-29 10:58:57,523] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 378 + 4: [2023-04-29 10:58:57,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 10:58:57,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:57,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:57,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 10:58:57,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:57,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:57,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 10:58:57,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 10:58:57,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +20: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +46: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt... +41: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt... +41: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt... +41: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt... + 6: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +46: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +20: [2023-04-29 10:58:57,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +20: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 10:58:57,528] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 380 +60: [2023-04-29 10:58:57,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 10:58:57,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +60: [2023-04-29 10:58:57,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:57,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:57,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +60: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt... +42: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt... +32: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt... +32: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt... +32: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt... +32: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt... +60: [2023-04-29 10:58:57,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 10:58:57,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,531] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 402 + 4: [2023-04-29 10:58:57,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +42: [2023-04-29 10:58:57,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt... +10: [2023-04-29 10:58:57,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... +60: [2023-04-29 10:58:57,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:57,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... +10: [2023-04-29 10:58:57,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... +10: [2023-04-29 10:58:57,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... +60: [2023-04-29 10:58:57,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:57,533] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 404 +60: [2023-04-29 10:58:57,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 10:58:57,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt... +54: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt... +35: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt... +35: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt... +54: [2023-04-29 10:58:57,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:57,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +54: [2023-04-29 10:58:57,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +26: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +26: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +26: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +52: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt... +26: [2023-04-29 10:58:57,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... +52: [2023-04-29 10:58:57,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:57,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 10:58:57,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:57,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 10:58:57,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +52: [2023-04-29 10:58:57,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 7: [2023-04-29 10:58:57,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... + 7: [2023-04-29 10:58:57,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... +29: [2023-04-29 10:58:57,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +39: [2023-04-29 10:58:57,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 10:58:57,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 10:58:57,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 10:58:57,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 10:58:57,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt... +53: [2023-04-29 10:58:57,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt... +53: [2023-04-29 10:58:57,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt... +14: [2023-04-29 10:58:57,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +53: [2023-04-29 10:58:57,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt... +47: [2023-04-29 10:58:57,544] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 382 +47: [2023-04-29 10:58:57,544] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 376 +29: [2023-04-29 10:58:57,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 10:58:57,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 10:58:57,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +61: [2023-04-29 10:58:57,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt... +61: [2023-04-29 10:58:57,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt... +61: [2023-04-29 10:58:57,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt... +61: [2023-04-29 10:58:57,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt... +29: [2023-04-29 10:58:57,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 10:58:57,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 10:58:57,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 10:58:57,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 10:58:57,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 10:58:57,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 10:58:57,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... +18: [2023-04-29 10:58:57,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... +18: [2023-04-29 10:58:57,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... +18: [2023-04-29 10:58:57,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... +43: [2023-04-29 10:58:57,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 10:58:57,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 10:58:57,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 10:58:57,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... +15: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... +15: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... +15: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +39: [2023-04-29 10:58:57,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:57,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:57,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:57,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 10:58:57,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:57,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +39: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 10:58:57,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 10:58:57,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 10:58:57,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 10:58:57,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 10:58:57,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 10:58:57,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 10:58:57,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 10:58:57,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 10:58:57,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 10:58:57,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +58: [2023-04-29 10:58:57,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 10:58:57,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:57,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:57,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 10:58:57,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +48: [2023-04-29 10:58:57,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:57,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:57,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 10:58:57,586] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 368 +60: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +60: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +60: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +48: [2023-04-29 10:58:57,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 10:58:57,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 10:58:57,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +10: [2023-04-29 10:58:57,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 10:58:57,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +48: [2023-04-29 10:58:57,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 10:58:57,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 10:58:57,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 10:58:57,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 10:58:57,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 10:58:57,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 10:58:57,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +20: [2023-04-29 10:58:57,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 10:58:57,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 10:58:57,597] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 370 +46: [2023-04-29 10:58:57,598] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 372 + 4: [2023-04-29 10:58:57,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 10:58:57,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 10:58:57,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 10:58:57,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:57,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 10:58:57,605] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 374 +58: [2023-04-29 10:58:57,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:57,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:57,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 10:58:57,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:57,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 10:58:57,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:57,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 10:58:57,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 10:58:57,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 10:58:57,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +10: [2023-04-29 10:58:57,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 10:58:57,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +62: [2023-04-29 10:58:57,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +62: [2023-04-29 10:58:57,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +58: [2023-04-29 10:58:57,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +58: [2023-04-29 10:58:57,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +58: [2023-04-29 10:58:57,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 10:58:57,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 10:58:57,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt... +43: [2023-04-29 10:58:57,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt... +10: [2023-04-29 10:58:57,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 10:58:57,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 10:58:57,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt... +43: [2023-04-29 10:58:57,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt... + 0: [2023-04-29 10:58:57,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +30: [2023-04-29 10:58:57,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 10:58:57,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 10:58:57,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 10:58:57,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +55: [2023-04-29 10:58:57,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 10:58:57,622] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 290 +55: [2023-04-29 10:58:57,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 10:58:57,623] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 292 + 6: [2023-04-29 10:58:57,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +10: [2023-04-29 10:58:57,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 10:58:57,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt... +51: [2023-04-29 10:58:57,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt... +51: [2023-04-29 10:58:57,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt... +51: [2023-04-29 10:58:57,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt... +46: [2023-04-29 10:58:57,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt... +46: [2023-04-29 10:58:57,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt... +46: [2023-04-29 10:58:57,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt... +46: [2023-04-29 10:58:57,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt... +55: [2023-04-29 10:58:57,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:57,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:57,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 10:58:57,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +55: [2023-04-29 10:58:57,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 10:58:57,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... + 0: [2023-04-29 10:58:57,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 10:58:57,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:57,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 10:58:57,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 10:58:57,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 10:58:57,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 10:58:57,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt. +60: [2023-04-29 10:58:57,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt... +60: [2023-04-29 10:58:57,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt... +40: [2023-04-29 10:58:57,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +40: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +34: [2023-04-29 10:58:57,635] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 278 +40: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt... +40: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 0: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 10:58:57,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt... +49: [2023-04-29 10:58:57,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 10:58:57,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 10:58:57,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 10:58:57,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 10:58:57,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 10:58:57,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 10:58:57,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 10:58:57,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 6: [2023-04-29 10:58:57,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 10:58:57,639] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 418 + 0: [2023-04-29 10:58:57,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... + 0: [2023-04-29 10:58:57,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +39: [2023-04-29 10:58:57,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt... +39: [2023-04-29 10:58:57,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,641] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 278 +39: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt... + 6: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt... +48: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt... +48: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt... +62: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt... +48: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt... +62: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:57,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 0: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +62: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +52: [2023-04-29 10:58:57,643] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 422 +14: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... +14: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... +14: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... +14: [2023-04-29 10:58:57,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... +52: [2023-04-29 10:58:57,644] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 416 +62: [2023-04-29 10:58:57,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 10:58:57,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +36: [2023-04-29 10:58:57,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 288 + 6: [2023-04-29 10:58:57,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +52: [2023-04-29 10:58:57,646] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 420 +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt... +52: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt... +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +62: [2023-04-29 10:58:57,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +62: [2023-04-29 10:58:57,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 10:58:57,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 10:58:57,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 10:58:57,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 4: [2023-04-29 10:58:57,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 4: [2023-04-29 10:58:57,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 4: [2023-04-29 10:58:57,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... + 4: [2023-04-29 10:58:57,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... +30: [2023-04-29 10:58:57,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:57,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 10:58:57,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 10:58:57,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 10:58:57,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 10:58:57,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 10:58:57,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 10:58:57,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt... +58: [2023-04-29 10:58:57,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt... +58: [2023-04-29 10:58:57,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt... +58: [2023-04-29 10:58:57,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt... +56: [2023-04-29 10:58:57,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:57,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:57,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 10:58:57,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 10:58:57,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 10:58:57,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 10:58:57,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 10:58:57,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 10:58:57,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:57,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:57,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 10:58:57,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +56: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +56: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 10:58:57,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:57,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:57,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 10:58:57,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +50: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +50: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +40: [2023-04-29 10:58:57,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 10:58:57,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 10:58:57,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +10: [2023-04-29 10:58:57,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 10:58:57,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +33: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +10: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +10: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +33: [2023-04-29 10:58:57,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +20: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +33: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... +20: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +44: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 10:58:57,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +34: [2023-04-29 10:58:57,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 10:58:57,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 10:58:57,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 10:58:57,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 10:58:57,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +34: [2023-04-29 10:58:57,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +34: [2023-04-29 10:58:57,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +44: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +10: [2023-04-29 10:58:57,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt... +55: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt... +55: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt... +55: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt... +33: [2023-04-29 10:58:57,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 10:58:57,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 10:58:57,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 10:58:57,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:57,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 10:58:57,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +62: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt... +62: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt... +62: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 10:58:57,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +62: [2023-04-29 10:58:57,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 10:58:57,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 10:58:57,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 10:58:57,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 10:58:57,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 10:58:57,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 10:58:57,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 10:58:57,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. + 2: [2023-04-29 10:58:57,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 2: [2023-04-29 10:58:57,714] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 22 +50: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt... +49: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt... +49: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt... +49: [2023-04-29 10:58:57,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt... +38: [2023-04-29 10:58:57,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 10:58:57,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 10:58:57,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 10:58:57,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +30: [2023-04-29 10:58:57,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 10:58:57,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:57,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:57,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:57,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +34: [2023-04-29 10:58:57,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:57,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +34: [2023-04-29 10:58:57,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:57,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 10:58:57,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +30: [2023-04-29 10:58:57,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,723] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 22 +30: [2023-04-29 10:58:57,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +30: [2023-04-29 10:58:57,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 10:58:57,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt... +56: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt... +56: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt... +56: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt... +40: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt... +40: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt... +40: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +34: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +34: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +34: [2023-04-29 10:58:57,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +30: [2023-04-29 10:58:57,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 10:58:57,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +30: [2023-04-29 10:58:57,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +36: [2023-04-29 10:58:57,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt. +45: [2023-04-29 10:58:57,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 10:58:57,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +36: [2023-04-29 10:58:57,733] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 294 +45: [2023-04-29 10:58:57,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:57,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 10:58:57,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:57,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 10:58:57,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 10:58:57,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 10:58:57,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt... +33: [2023-04-29 10:58:57,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt... +33: [2023-04-29 10:58:57,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt... +33: [2023-04-29 10:58:57,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt... +36: [2023-04-29 10:58:57,742] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 294 +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 10:58:57,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +17: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. +38: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +17: [2023-04-29 10:58:57,744] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 136 +38: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 10:58:57,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +12: [2023-04-29 10:58:57,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 10:58:57,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 10:58:57,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 10:58:57,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 10:58:57,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. +17: [2023-04-29 10:58:57,750] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 138 +17: [2023-04-29 10:58:57,751] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 136 +19: [2023-04-29 10:58:57,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. +19: [2023-04-29 10:58:57,752] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 154 +38: [2023-04-29 10:58:57,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 10:58:57,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 10:58:57,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 10:58:57,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +17: [2023-04-29 10:58:57,757] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 138 +19: [2023-04-29 10:58:57,760] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 154 +50: [2023-04-29 10:58:57,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt... +50: [2023-04-29 10:58:57,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt... +22: [2023-04-29 10:58:57,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 10:58:57,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 10:58:57,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 10:58:57,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +34: [2023-04-29 10:58:57,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt... +34: [2023-04-29 10:58:57,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt... +12: [2023-04-29 10:58:57,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 10:58:57,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 10:58:57,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 3: [2023-04-29 10:58:57,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 10:58:57,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:57,783] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 206 +44: [2023-04-29 10:58:57,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt... +44: [2023-04-29 10:58:57,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt... +44: [2023-04-29 10:58:57,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt... +44: [2023-04-29 10:58:57,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt... +45: [2023-04-29 10:58:57,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt... +45: [2023-04-29 10:58:57,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt... +45: [2023-04-29 10:58:57,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt... +45: [2023-04-29 10:58:57,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt... +25: [2023-04-29 10:58:57,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 206 +38: [2023-04-29 10:58:57,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt... +38: [2023-04-29 10:58:57,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt... +38: [2023-04-29 10:58:57,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt... +38: [2023-04-29 10:58:57,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt... +37: [2023-04-29 10:58:57,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 10:58:57,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 10:58:57,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 10:58:57,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 10:58:57,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:57,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:57,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:57,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:57,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:57,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:57,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 10:58:57,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 10:58:57,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +31: [2023-04-29 10:58:57,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +31: [2023-04-29 10:58:57,827] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 250 +37: [2023-04-29 10:58:57,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 10:58:57,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 10:58:57,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 10:58:57,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +37: [2023-04-29 10:58:57,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +37: [2023-04-29 10:58:57,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +30: [2023-04-29 10:58:57,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +30: [2023-04-29 10:58:57,830] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 244 +37: [2023-04-29 10:58:57,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +31: [2023-04-29 10:58:57,835] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 250 +30: [2023-04-29 10:58:57,839] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 244 +12: [2023-04-29 10:58:57,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 10:58:57,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. + 2: [2023-04-29 10:58:57,844] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 18 +12: [2023-04-29 10:58:57,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +12: [2023-04-29 10:58:57,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 10:58:57,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 10:58:57,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 10:58:57,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 10:58:57,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 10:58:57,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 10:58:57,854] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 18 +12: [2023-04-29 10:58:57,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +12: [2023-04-29 10:58:57,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 10:58:57,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 10:58:57,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:57,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt... +24: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 10:58:57,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 10:58:57,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 10:58:57,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 10:58:57,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 10:58:57,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 10:58:57,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:57,864] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 202 +25: [2023-04-29 10:58:57,871] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 202 +37: [2023-04-29 10:58:57,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt... +37: [2023-04-29 10:58:57,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt... +37: [2023-04-29 10:58:57,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt... +37: [2023-04-29 10:58:57,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt... + 3: [2023-04-29 10:58:57,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt... + 3: [2023-04-29 10:58:57,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt... + 3: [2023-04-29 10:58:57,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt... + 3: [2023-04-29 10:58:57,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt... +22: [2023-04-29 10:58:57,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt... +22: [2023-04-29 10:58:57,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt... +22: [2023-04-29 10:58:57,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt... +22: [2023-04-29 10:58:57,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt... + 2: [2023-04-29 10:58:57,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 2: [2023-04-29 10:58:57,898] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 16 + 1: [2023-04-29 10:58:57,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 10:58:57,906] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 16 +43: [2023-04-29 10:58:57,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt. +43: [2023-04-29 10:58:57,917] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 346 +43: [2023-04-29 10:58:57,925] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 346 +21: [2023-04-29 10:58:57,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:57,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 10:58:57,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 10:58:57,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 10:58:57,925] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 170 +25: [2023-04-29 10:58:57,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. + 2: [2023-04-29 10:58:57,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 5: [2023-04-29 10:58:57,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 46 + 2: [2023-04-29 10:58:57,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 20 +21: [2023-04-29 10:58:57,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 170 +31: [2023-04-29 10:58:57,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. +31: [2023-04-29 10:58:57,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 248 +31: [2023-04-29 10:58:57,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 10:58:57,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 10:58:57,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 10:58:57,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +31: [2023-04-29 10:58:57,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 10:58:57,936] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 252 + 2: [2023-04-29 10:58:57,938] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 20 +31: [2023-04-29 10:58:57,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 248 + 5: [2023-04-29 10:58:57,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 46 +17: [2023-04-29 10:58:57,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt... +17: [2023-04-29 10:58:57,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt... +17: [2023-04-29 10:58:57,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt... +17: [2023-04-29 10:58:57,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt... +31: [2023-04-29 10:58:57,944] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 252 +19: [2023-04-29 10:58:57,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt... +19: [2023-04-29 10:58:57,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt... +19: [2023-04-29 10:58:57,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt... +19: [2023-04-29 10:58:57,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt... + 1: [2023-04-29 10:58:57,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 1: [2023-04-29 10:58:57,949] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 8 +31: [2023-04-29 10:58:57,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +31: [2023-04-29 10:58:57,953] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 254 + 5: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt... + 1: [2023-04-29 10:58:57,956] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 8 +24: [2023-04-29 10:58:57,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt... +24: [2023-04-29 10:58:57,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt... +24: [2023-04-29 10:58:57,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt... +31: [2023-04-29 10:58:57,962] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 254 +27: [2023-04-29 10:58:57,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt... +27: [2023-04-29 10:58:57,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt... +27: [2023-04-29 10:58:57,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt... +27: [2023-04-29 10:58:57,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt... + 8: [2023-04-29 10:58:57,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 10:58:57,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +16: [2023-04-29 10:58:57,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:57,975] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 134 +57: [2023-04-29 10:58:57,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 10:58:57,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 10:58:57,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 10:58:57,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +16: [2023-04-29 10:58:57,983] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 134 +17: [2023-04-29 10:58:57,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. +17: [2023-04-29 10:58:57,985] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 142 +22: [2023-04-29 10:58:57,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +22: [2023-04-29 10:58:57,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 178 +23: [2023-04-29 10:58:57,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +23: [2023-04-29 10:58:57,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 10:58:57,995] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 142 +22: [2023-04-29 10:58:57,995] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 178 +23: [2023-04-29 10:58:57,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +23: [2023-04-29 10:58:57,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:57,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt... + 1: [2023-04-29 10:58:57,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt... + 1: [2023-04-29 10:58:57,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt... + 1: [2023-04-29 10:58:57,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt... +13: [2023-04-29 10:58:58,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 10:58:58,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 10:58:58,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 10:58:58,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +16: [2023-04-29 10:58:58,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:58,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 132 + 6: [2023-04-29 10:58:58,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. + 6: [2023-04-29 10:58:58,012] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 48 +25: [2023-04-29 10:58:58,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt... +31: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt... +31: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt... +25: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt... +25: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt... +25: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt... +31: [2023-04-29 10:58:58,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt... +16: [2023-04-29 10:58:58,015] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 132 +31: [2023-04-29 10:58:58,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt... +57: [2023-04-29 10:58:58,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:58,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:58,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +57: [2023-04-29 10:58:58,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 10:58:58,021] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 48 +57: [2023-04-29 10:58:58,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 10:58:58,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 10:58:58,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 10:58:58,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 10:58:58,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 10:58:58,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +57: [2023-04-29 10:58:58,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. + 3: [2023-04-29 10:58:58,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. + 3: [2023-04-29 10:58:58,028] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 28 + 9: [2023-04-29 10:58:58,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 9: [2023-04-29 10:58:58,032] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 74 + 3: [2023-04-29 10:58:58,035] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 28 + 9: [2023-04-29 10:58:58,038] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 74 + 9: [2023-04-29 10:58:58,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 10:58:58,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 10:58:58,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 10:58:58,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 10:58:58,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. +19: [2023-04-29 10:58:58,044] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 158 +19: [2023-04-29 10:58:58,053] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 158 +54: [2023-04-29 10:58:58,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt. +54: [2023-04-29 10:58:58,053] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 437 + 5: [2023-04-29 10:58:58,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt... + 5: [2023-04-29 10:58:58,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt... + 5: [2023-04-29 10:58:58,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt... + 5: [2023-04-29 10:58:58,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt... +13: [2023-04-29 10:58:58,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. +13: [2023-04-29 10:58:58,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 108 +47: [2023-04-29 10:58:58,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +47: [2023-04-29 10:58:58,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +47: [2023-04-29 10:58:58,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +47: [2023-04-29 10:58:58,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 10:58:58,060] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 437 +13: [2023-04-29 10:58:58,065] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 108 +21: [2023-04-29 10:58:58,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. +21: [2023-04-29 10:58:58,076] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 168 + 9: [2023-04-29 10:58:58,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 9: [2023-04-29 10:58:58,077] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 78 + 8: [2023-04-29 10:58:58,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt... + 8: [2023-04-29 10:58:58,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt... + 8: [2023-04-29 10:58:58,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt... + 8: [2023-04-29 10:58:58,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt... +15: [2023-04-29 10:58:58,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 10:58:58,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 10:58:58,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 10:58:58,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 10:58:58,082] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 168 +57: [2023-04-29 10:58:58,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt... +57: [2023-04-29 10:58:58,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt... +57: [2023-04-29 10:58:58,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt... +57: [2023-04-29 10:58:58,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt... +47: [2023-04-29 10:58:58,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:58,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 10:58:58,085] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 78 +47: [2023-04-29 10:58:58,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:58,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:58,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +47: [2023-04-29 10:58:58,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +11: [2023-04-29 10:58:58,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +11: [2023-04-29 10:58:58,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +11: [2023-04-29 10:58:58,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +11: [2023-04-29 10:58:58,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +47: [2023-04-29 10:58:58,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:58,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 10:58:58,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:58,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +47: [2023-04-29 10:58:58,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 10:58:58,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt... +21: [2023-04-29 10:58:58,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +21: [2023-04-29 10:58:58,096] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 172 +21: [2023-04-29 10:58:58,104] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 172 +24: [2023-04-29 10:58:58,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +24: [2023-04-29 10:58:58,112] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 192 +47: [2023-04-29 10:58:58,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 10:58:58,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 10:58:58,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 10:58:58,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt. +13: [2023-04-29 10:58:58,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt... +13: [2023-04-29 10:58:58,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt... +13: [2023-04-29 10:58:58,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt... +13: [2023-04-29 10:58:58,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt... +23: [2023-04-29 10:58:58,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt... +23: [2023-04-29 10:58:58,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt... +23: [2023-04-29 10:58:58,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt... +23: [2023-04-29 10:58:58,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt... +24: [2023-04-29 10:58:58,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 192 +16: [2023-04-29 10:58:58,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +16: [2023-04-29 10:58:58,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:58,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:58,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 10:58:58,122] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 12 +16: [2023-04-29 10:58:58,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 10:58:58,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. + 5: [2023-04-29 10:58:58,125] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 42 + 1: [2023-04-29 10:58:58,130] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 12 + 5: [2023-04-29 10:58:58,133] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 42 + 9: [2023-04-29 10:58:58,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt... + 9: [2023-04-29 10:58:58,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt... + 9: [2023-04-29 10:58:58,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt... + 9: [2023-04-29 10:58:58,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt... +36: [2023-04-29 10:58:58,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt. +36: [2023-04-29 10:58:58,137] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 295 + 8: [2023-04-29 10:58:58,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. + 8: [2023-04-29 10:58:58,149] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 66 + 9: [2023-04-29 10:58:58,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. + 9: [2023-04-29 10:58:58,152] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 72 +26: [2023-04-29 10:58:58,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +26: [2023-04-29 10:58:58,154] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 214 + 8: [2023-04-29 10:58:58,158] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 66 + 3: [2023-04-29 10:58:58,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 3: [2023-04-29 10:58:58,160] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 26 +47: [2023-04-29 10:58:58,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt... +47: [2023-04-29 10:58:58,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt... +47: [2023-04-29 10:58:58,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt... +47: [2023-04-29 10:58:58,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt... + 9: [2023-04-29 10:58:58,160] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 72 +26: [2023-04-29 10:58:58,162] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 214 +41: [2023-04-29 10:58:58,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt. +41: [2023-04-29 10:58:58,164] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 331 +11: [2023-04-29 10:58:58,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt... +11: [2023-04-29 10:58:58,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt... +11: [2023-04-29 10:58:58,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt... +11: [2023-04-29 10:58:58,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt... +23: [2023-04-29 10:58:58,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +23: [2023-04-29 10:58:58,167] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 184 +35: [2023-04-29 10:58:58,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt. + 3: [2023-04-29 10:58:58,168] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 26 +35: [2023-04-29 10:58:58,168] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 281 +41: [2023-04-29 10:58:58,171] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 331 +42: [2023-04-29 10:58:58,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt. +42: [2023-04-29 10:58:58,175] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 339 +35: [2023-04-29 10:58:58,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 281 +23: [2023-04-29 10:58:58,177] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 184 +18: [2023-04-29 10:58:58,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 10:58:58,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 10:58:58,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 10:58:58,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +59: [2023-04-29 10:58:58,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt. +59: [2023-04-29 10:58:58,184] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 473 +22: [2023-04-29 10:58:58,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +22: [2023-04-29 10:58:58,186] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 182 +59: [2023-04-29 10:58:58,190] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 473 +35: [2023-04-29 10:58:58,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt. +22: [2023-04-29 10:58:58,193] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 182 +35: [2023-04-29 10:58:58,193] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 287 +24: [2023-04-29 10:58:58,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +24: [2023-04-29 10:58:58,194] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 194 +26: [2023-04-29 10:58:58,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +26: [2023-04-29 10:58:58,195] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 208 +35: [2023-04-29 10:58:58,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt. +35: [2023-04-29 10:58:58,197] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 283 +39: [2023-04-29 10:58:58,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt. +35: [2023-04-29 10:58:58,200] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 287 +39: [2023-04-29 10:58:58,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 313 +24: [2023-04-29 10:58:58,200] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 194 +26: [2023-04-29 10:58:58,203] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 208 +63: [2023-04-29 10:58:58,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt. +63: [2023-04-29 10:58:58,204] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 505 +22: [2023-04-29 10:58:58,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +35: [2023-04-29 10:58:58,205] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 283 +22: [2023-04-29 10:58:58,205] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 176 +16: [2023-04-29 10:58:58,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt... +16: [2023-04-29 10:58:58,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt... +16: [2023-04-29 10:58:58,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt... +16: [2023-04-29 10:58:58,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt... +15: [2023-04-29 10:58:58,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt... +15: [2023-04-29 10:58:58,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt... +15: [2023-04-29 10:58:58,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt... +15: [2023-04-29 10:58:58,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt... +41: [2023-04-29 10:58:58,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt. +41: [2023-04-29 10:58:58,210] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 333 +22: [2023-04-29 10:58:58,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 176 +43: [2023-04-29 10:58:58,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt. +43: [2023-04-29 10:58:58,211] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 345 +63: [2023-04-29 10:58:58,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 505 +28: [2023-04-29 10:58:58,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +28: [2023-04-29 10:58:58,213] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 230 +41: [2023-04-29 10:58:58,217] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 333 +41: [2023-04-29 10:58:58,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt. +41: [2023-04-29 10:58:58,218] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 335 +43: [2023-04-29 10:58:58,219] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 345 +28: [2023-04-29 10:58:58,219] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 230 + 8: [2023-04-29 10:58:58,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 8: [2023-04-29 10:58:58,220] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 68 +61: [2023-04-29 10:58:58,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt. +61: [2023-04-29 10:58:58,222] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 491 +41: [2023-04-29 10:58:58,225] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 335 + 8: [2023-04-29 10:58:58,226] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 68 +15: [2023-04-29 10:58:58,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +15: [2023-04-29 10:58:58,229] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 120 +23: [2023-04-29 10:58:58,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. +23: [2023-04-29 10:58:58,233] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 186 +39: [2023-04-29 10:58:58,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt. +39: [2023-04-29 10:58:58,236] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 315 +29: [2023-04-29 10:58:58,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +29: [2023-04-29 10:58:58,237] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 236 + 7: [2023-04-29 10:58:58,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 10:58:58,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 10:58:58,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 10:58:58,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 10:58:58,238] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 120 +23: [2023-04-29 10:58:58,240] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 186 +29: [2023-04-29 10:58:58,244] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 236 +62: [2023-04-29 10:58:58,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt. +62: [2023-04-29 10:58:58,246] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 501 +15: [2023-04-29 10:58:58,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +15: [2023-04-29 10:58:58,250] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 124 +61: [2023-04-29 10:58:58,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt. +13: [2023-04-29 10:58:58,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. +61: [2023-04-29 10:58:58,255] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 489 +13: [2023-04-29 10:58:58,255] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 104 +15: [2023-04-29 10:58:58,257] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 124 +13: [2023-04-29 10:58:58,264] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 104 + 0: [2023-04-29 10:58:58,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. + 0: [2023-04-29 10:58:58,271] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 6 + 0: [2023-04-29 10:58:58,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 10:58:58,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 10:58:58,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 10:58:58,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 10:58:58,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt... +18: [2023-04-29 10:58:58,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt... +18: [2023-04-29 10:58:58,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt... +18: [2023-04-29 10:58:58,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt... + 0: [2023-04-29 10:58:58,279] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 6 +18: [2023-04-29 10:58:58,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +18: [2023-04-29 10:58:58,281] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 148 +14: [2023-04-29 10:58:58,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +14: [2023-04-29 10:58:58,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +14: [2023-04-29 10:58:58,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +14: [2023-04-29 10:58:58,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +39: [2023-04-29 10:58:58,284] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 313 +39: [2023-04-29 10:58:58,287] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 315 +18: [2023-04-29 10:58:58,290] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 148 +62: [2023-04-29 10:58:58,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt. +62: [2023-04-29 10:58:58,290] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 497 +61: [2023-04-29 10:58:58,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt. +61: [2023-04-29 10:58:58,293] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 495 +49: [2023-04-29 10:58:58,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt. +49: [2023-04-29 10:58:58,300] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 399 +28: [2023-04-29 10:58:58,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 10:58:58,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 10:58:58,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 10:58:58,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 10:58:58,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 6: [2023-04-29 10:58:58,306] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 54 +49: [2023-04-29 10:58:58,307] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 399 +29: [2023-04-29 10:58:58,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 10:58:58,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +34: [2023-04-29 10:58:58,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt. +34: [2023-04-29 10:58:58,312] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 277 +29: [2023-04-29 10:58:58,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 10:58:58,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 10:58:58,312] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 54 + 7: [2023-04-29 10:58:58,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt... + 7: [2023-04-29 10:58:58,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt... + 7: [2023-04-29 10:58:58,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt... + 7: [2023-04-29 10:58:58,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. +12: [2023-04-29 10:58:58,319] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 98 +44: [2023-04-29 10:58:58,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt. +44: [2023-04-29 10:58:58,320] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 359 +30: [2023-04-29 10:58:58,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 10:58:58,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 10:58:58,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 10:58:58,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 10:58:58,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 10:58:58,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 10:58:58,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 10:58:58,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:58,329] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 98 +50: [2023-04-29 10:58:58,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt. +50: [2023-04-29 10:58:58,338] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 405 +10: [2023-04-29 10:58:58,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 10:58:58,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +55: [2023-04-29 10:58:58,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt. +55: [2023-04-29 10:58:58,339] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 443 +10: [2023-04-29 10:58:58,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 10:58:58,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +46: [2023-04-29 10:58:58,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt. +62: [2023-04-29 10:58:58,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt. +46: [2023-04-29 10:58:58,345] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 369 +62: [2023-04-29 10:58:58,345] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 503 +43: [2023-04-29 10:58:58,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt. +43: [2023-04-29 10:58:58,346] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 349 +55: [2023-04-29 10:58:58,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 443 +50: [2023-04-29 10:58:58,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 405 +49: [2023-04-29 10:58:58,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt. +49: [2023-04-29 10:58:58,352] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 397 +46: [2023-04-29 10:58:58,352] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 369 + 2: [2023-04-29 10:58:58,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt... + 0: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt... + 0: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt... + 0: [2023-04-29 10:58:58,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt... +43: [2023-04-29 10:58:58,355] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 349 +61: [2023-04-29 10:58:58,355] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 495 +61: [2023-04-29 10:58:58,356] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 489 +49: [2023-04-29 10:58:58,358] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 397 +60: [2023-04-29 10:58:58,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt. +60: [2023-04-29 10:58:58,361] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 485 +61: [2023-04-29 10:58:58,362] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 491 +21: [2023-04-29 10:58:58,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 10:58:58,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 10:58:58,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 10:58:58,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 10:58:58,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. +19: [2023-04-29 10:58:58,364] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 156 +23: [2023-04-29 10:58:58,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +23: [2023-04-29 10:58:58,365] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 188 +62: [2023-04-29 10:58:58,367] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 497 +60: [2023-04-29 10:58:58,368] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 485 + 4: [2023-04-29 10:58:58,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 10:58:58,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 10:58:58,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 10:58:58,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +62: [2023-04-29 10:58:58,371] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 503 +19: [2023-04-29 10:58:58,372] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 156 +62: [2023-04-29 10:58:58,372] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 501 +62: [2023-04-29 10:58:58,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt. +62: [2023-04-29 10:58:58,372] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 499 +33: [2023-04-29 10:58:58,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt. +33: [2023-04-29 10:58:58,373] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 265 +23: [2023-04-29 10:58:58,373] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 188 +55: [2023-04-29 10:58:58,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt. +55: [2023-04-29 10:58:58,375] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 441 +20: [2023-04-29 10:58:58,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 10:58:58,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. +14: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt... +14: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt... +14: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt... +14: [2023-04-29 10:58:58,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,379] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 96 +62: [2023-04-29 10:58:58,379] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 499 +33: [2023-04-29 10:58:58,380] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 265 +55: [2023-04-29 10:58:58,381] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 441 +60: [2023-04-29 10:58:58,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt. +42: [2023-04-29 10:58:58,384] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 339 +32: [2023-04-29 10:58:58,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt. +60: [2023-04-29 10:58:58,385] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 481 +32: [2023-04-29 10:58:58,384] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 259 +44: [2023-04-29 10:58:58,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt. +44: [2023-04-29 10:58:58,385] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 357 + 5: [2023-04-29 10:58:58,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 5: [2023-04-29 10:58:58,386] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 44 + 6: [2023-04-29 10:58:58,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 10:58:58,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 10:58:58,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +63: [2023-04-29 10:58:58,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt. + 6: [2023-04-29 10:58:58,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +63: [2023-04-29 10:58:58,388] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 507 +12: [2023-04-29 10:58:58,389] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 96 +28: [2023-04-29 10:58:58,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt... +28: [2023-04-29 10:58:58,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt... +32: [2023-04-29 10:58:58,391] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 259 +60: [2023-04-29 10:58:58,392] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 481 +28: [2023-04-29 10:58:58,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. +28: [2023-04-29 10:58:58,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,392] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 82 + 5: [2023-04-29 10:58:58,392] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 44 +63: [2023-04-29 10:58:58,395] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 507 +46: [2023-04-29 10:58:58,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt. +46: [2023-04-29 10:58:58,396] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 373 +29: [2023-04-29 10:58:58,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt... +29: [2023-04-29 10:58:58,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt... +29: [2023-04-29 10:58:58,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt... +29: [2023-04-29 10:58:58,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,400] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 82 +34: [2023-04-29 10:58:58,403] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 277 +46: [2023-04-29 10:58:58,403] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 373 +26: [2023-04-29 10:58:58,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt... +26: [2023-04-29 10:58:58,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt... +26: [2023-04-29 10:58:58,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt... +52: [2023-04-29 10:58:58,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt. +52: [2023-04-29 10:58:58,406] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 423 +26: [2023-04-29 10:58:58,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt... +34: [2023-04-29 10:58:58,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt. +34: [2023-04-29 10:58:58,407] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 274 +12: [2023-04-29 10:58:58,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. +12: [2023-04-29 10:58:58,409] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 100 +61: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt. +61: [2023-04-29 10:58:58,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 493 +60: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt. +30: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt... +30: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt... +30: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt... +60: [2023-04-29 10:58:58,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 483 +27: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +27: [2023-04-29 10:58:58,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 222 +30: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt... + 0: [2023-04-29 10:58:58,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. + 0: [2023-04-29 10:58:58,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 2 +56: [2023-04-29 10:58:58,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt. +56: [2023-04-29 10:58:58,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 451 +36: [2023-04-29 10:58:58,413] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 295 +25: [2023-04-29 10:58:58,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:58,413] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 204 +34: [2023-04-29 10:58:58,415] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 274 +13: [2023-04-29 10:58:58,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. +13: [2023-04-29 10:58:58,416] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 110 +12: [2023-04-29 10:58:58,416] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 100 +61: [2023-04-29 10:58:58,417] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 493 +27: [2023-04-29 10:58:58,418] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 222 +60: [2023-04-29 10:58:58,418] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 483 +56: [2023-04-29 10:58:58,419] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 451 +25: [2023-04-29 10:58:58,420] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 204 + 0: [2023-04-29 10:58:58,420] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 2 +52: [2023-04-29 10:58:58,423] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 423 +13: [2023-04-29 10:58:58,424] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 110 + 2: [2023-04-29 10:58:58,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt... + 2: [2023-04-29 10:58:58,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt... + 2: [2023-04-29 10:58:58,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt... + 2: [2023-04-29 10:58:58,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt... +10: [2023-04-29 10:58:58,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt... +27: [2023-04-29 10:58:58,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +27: [2023-04-29 10:58:58,426] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 218 +38: [2023-04-29 10:58:58,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt. +38: [2023-04-29 10:58:58,428] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 307 +27: [2023-04-29 10:58:58,433] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 218 +21: [2023-04-29 10:58:58,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt... +21: [2023-04-29 10:58:58,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt... +21: [2023-04-29 10:58:58,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt... +21: [2023-04-29 10:58:58,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt... +54: [2023-04-29 10:58:58,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt. +54: [2023-04-29 10:58:58,439] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 435 +38: [2023-04-29 10:58:58,439] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 307 +36: [2023-04-29 10:58:58,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt. +36: [2023-04-29 10:58:58,440] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 289 +42: [2023-04-29 10:58:58,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt. +42: [2023-04-29 10:58:58,441] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 341 +32: [2023-04-29 10:58:58,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt. +45: [2023-04-29 10:58:58,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt. +32: [2023-04-29 10:58:58,442] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 257 +45: [2023-04-29 10:58:58,443] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 363 +54: [2023-04-29 10:58:58,445] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 435 +38: [2023-04-29 10:58:58,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt. +38: [2023-04-29 10:58:58,446] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 309 +36: [2023-04-29 10:58:58,446] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 289 +42: [2023-04-29 10:58:58,448] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 341 +32: [2023-04-29 10:58:58,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 257 +45: [2023-04-29 10:58:58,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 363 +42: [2023-04-29 10:58:58,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt. +42: [2023-04-29 10:58:58,451] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 337 +26: [2023-04-29 10:58:58,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +38: [2023-04-29 10:58:58,453] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 309 +26: [2023-04-29 10:58:58,453] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 212 + 4: [2023-04-29 10:58:58,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt... + 4: [2023-04-29 10:58:58,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt... + 4: [2023-04-29 10:58:58,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt... + 4: [2023-04-29 10:58:58,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt... +42: [2023-04-29 10:58:58,458] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 337 +26: [2023-04-29 10:58:58,461] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 212 +20: [2023-04-29 10:58:58,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt... +20: [2023-04-29 10:58:58,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt... +20: [2023-04-29 10:58:58,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt... +20: [2023-04-29 10:58:58,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt... + 4: [2023-04-29 10:58:58,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. + 4: [2023-04-29 10:58:58,470] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 36 + 6: [2023-04-29 10:58:58,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt... + 6: [2023-04-29 10:58:58,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt... + 6: [2023-04-29 10:58:58,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt... + 6: [2023-04-29 10:58:58,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:58,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:58,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 10:58:58,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 10:58:58,476] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 36 +25: [2023-04-29 10:58:58,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:58,478] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 200 +25: [2023-04-29 10:58:58,485] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 200 +28: [2023-04-29 10:58:58,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +28: [2023-04-29 10:58:58,488] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 228 +30: [2023-04-29 10:58:58,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +30: [2023-04-29 10:58:58,491] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 240 + 8: [2023-04-29 10:58:58,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. + 8: [2023-04-29 10:58:58,493] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 64 +34: [2023-04-29 10:58:58,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt. +34: [2023-04-29 10:58:58,493] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 273 +28: [2023-04-29 10:58:58,496] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 228 + 3: [2023-04-29 10:58:58,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. + 3: [2023-04-29 10:58:58,497] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 30 + 8: [2023-04-29 10:58:58,500] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 64 +30: [2023-04-29 10:58:58,501] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 240 +34: [2023-04-29 10:58:58,501] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 273 + 3: [2023-04-29 10:58:58,504] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 30 +52: [2023-04-29 10:58:58,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt. +52: [2023-04-29 10:58:58,509] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 419 +30: [2023-04-29 10:58:58,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +30: [2023-04-29 10:58:58,509] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 246 +39: [2023-04-29 10:58:58,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt. +39: [2023-04-29 10:58:58,513] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 317 +52: [2023-04-29 10:58:58,517] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 419 +19: [2023-04-29 10:58:58,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt. +30: [2023-04-29 10:58:58,517] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 246 +19: [2023-04-29 10:58:58,517] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 157 +31: [2023-04-29 10:58:58,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt. +31: [2023-04-29 10:58:58,521] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 253 +39: [2023-04-29 10:58:58,521] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 317 +32: [2023-04-29 10:58:58,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt. +32: [2023-04-29 10:58:58,523] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 263 +19: [2023-04-29 10:58:58,524] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 157 +44: [2023-04-29 10:58:58,525] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 357 +44: [2023-04-29 10:58:58,526] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 359 +31: [2023-04-29 10:58:58,528] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 253 + 3: [2023-04-29 10:58:58,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt. + 3: [2023-04-29 10:58:58,532] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 29 +32: [2023-04-29 10:58:58,532] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 263 +48: [2023-04-29 10:58:58,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt. +48: [2023-04-29 10:58:58,538] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 391 + 3: [2023-04-29 10:58:58,539] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 29 + 1: [2023-04-29 10:58:58,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt. + 1: [2023-04-29 10:58:58,543] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 13 +48: [2023-04-29 10:58:58,545] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 391 +35: [2023-04-29 10:58:58,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt. +35: [2023-04-29 10:58:58,547] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 285 + 1: [2023-04-29 10:58:58,550] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 13 + 3: [2023-04-29 10:58:58,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt. + 3: [2023-04-29 10:58:58,552] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 27 + 1: [2023-04-29 10:58:58,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt. + 1: [2023-04-29 10:58:58,555] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 15 +35: [2023-04-29 10:58:58,556] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 285 +12: [2023-04-29 10:58:58,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt... +12: [2023-04-29 10:58:58,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt... + 3: [2023-04-29 10:58:58,559] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 27 +44: [2023-04-29 10:58:58,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt. + 1: [2023-04-29 10:58:58,562] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 15 +44: [2023-04-29 10:58:58,562] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 355 +33: [2023-04-29 10:58:58,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt. +33: [2023-04-29 10:58:58,564] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 271 +44: [2023-04-29 10:58:58,568] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 355 +33: [2023-04-29 10:58:58,572] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 271 +40: [2023-04-29 10:58:58,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt. +40: [2023-04-29 10:58:58,577] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 323 + 5: [2023-04-29 10:58:58,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt. + 5: [2023-04-29 10:58:58,577] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 47 + 4: [2023-04-29 10:58:58,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. + 4: [2023-04-29 10:58:58,579] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 32 +34: [2023-04-29 10:58:58,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt. +34: [2023-04-29 10:58:58,579] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 275 +53: [2023-04-29 10:58:58,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt. +53: [2023-04-29 10:58:58,582] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 425 +40: [2023-04-29 10:58:58,583] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 323 + 5: [2023-04-29 10:58:58,584] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 47 +24: [2023-04-29 10:58:58,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt. +24: [2023-04-29 10:58:58,586] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 197 +34: [2023-04-29 10:58:58,587] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 275 + 4: [2023-04-29 10:58:58,587] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 32 +53: [2023-04-29 10:58:58,589] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 425 +50: [2023-04-29 10:58:58,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt. +50: [2023-04-29 10:58:58,590] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 401 +24: [2023-04-29 10:58:58,593] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 197 +50: [2023-04-29 10:58:58,597] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 401 + 5: [2023-04-29 10:58:58,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt. + 5: [2023-04-29 10:58:58,603] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 45 + 0: [2023-04-29 10:58:58,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. + 0: [2023-04-29 10:58:58,608] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 0 + 5: [2023-04-29 10:58:58,610] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 45 +17: [2023-04-29 10:58:58,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt. +17: [2023-04-29 10:58:58,611] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 143 +17: [2023-04-29 10:58:58,618] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 143 + 0: [2023-04-29 10:58:58,618] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 0 +51: [2023-04-29 10:58:58,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt. +27: [2023-04-29 10:58:58,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt. +10: [2023-04-29 10:58:58,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. +27: [2023-04-29 10:58:58,621] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 217 +51: [2023-04-29 10:58:58,620] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 409 +10: [2023-04-29 10:58:58,621] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 84 +31: [2023-04-29 10:58:58,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt. +31: [2023-04-29 10:58:58,622] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 249 +32: [2023-04-29 10:58:58,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt. +32: [2023-04-29 10:58:58,624] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 261 + 8: [2023-04-29 10:58:58,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. +25: [2023-04-29 10:58:58,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt. +25: [2023-04-29 10:58:58,625] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 207 + 8: [2023-04-29 10:58:58,625] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 70 + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 + 4: [2023-04-29 10:58:58,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. + 4: [2023-04-29 10:58:58,627] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 34 +27: [2023-04-29 10:58:58,627] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 217 +31: [2023-04-29 10:58:58,628] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 249 +58: [2023-04-29 10:58:58,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt. +58: [2023-04-29 10:58:58,628] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 465 +10: [2023-04-29 10:58:58,629] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 84 +32: [2023-04-29 10:58:58,631] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 261 +25: [2023-04-29 10:58:58,631] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 207 + 8: [2023-04-29 10:58:58,633] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 70 +52: [2023-04-29 10:58:58,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt. +52: [2023-04-29 10:58:58,634] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 417 + 4: [2023-04-29 10:58:58,634] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 34 +58: [2023-04-29 10:58:58,635] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 465 +52: [2023-04-29 10:58:58,643] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 417 +12: [2023-04-29 10:58:58,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. +12: [2023-04-29 10:58:58,644] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 102 +36: [2023-04-29 10:58:58,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt. +36: [2023-04-29 10:58:58,647] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 291 +51: [2023-04-29 10:58:58,649] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 409 +12: [2023-04-29 10:58:58,652] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 102 +49: [2023-04-29 10:58:58,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt. +49: [2023-04-29 10:58:58,652] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 395 +36: [2023-04-29 10:58:58,653] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 291 +49: [2023-04-29 10:58:58,659] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 395 +33: [2023-04-29 10:58:58,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt. +33: [2023-04-29 10:58:58,663] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 267 +33: [2023-04-29 10:58:58,671] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 267 +57: [2023-04-29 10:58:58,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt. +57: [2023-04-29 10:58:58,672] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 457 +11: [2023-04-29 10:58:58,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. +11: [2023-04-29 10:58:58,674] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 88 +17: [2023-04-29 10:58:58,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +17: [2023-04-29 10:58:58,679] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 140 +57: [2023-04-29 10:58:58,679] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 457 +11: [2023-04-29 10:58:58,681] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 88 + 5: [2023-04-29 10:58:58,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. + 5: [2023-04-29 10:58:58,683] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 40 + 8: [2023-04-29 10:58:58,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt. + 8: [2023-04-29 10:58:58,684] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 67 +39: [2023-04-29 10:58:58,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt. +39: [2023-04-29 10:58:58,685] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 319 +17: [2023-04-29 10:58:58,686] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 140 +13: [2023-04-29 10:58:58,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt. +13: [2023-04-29 10:58:58,688] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 107 + 9: [2023-04-29 10:58:58,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:58,690] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 77 +42: [2023-04-29 10:58:58,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt. + 5: [2023-04-29 10:58:58,690] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 40 +42: [2023-04-29 10:58:58,690] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 343 + 8: [2023-04-29 10:58:58,693] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 67 +39: [2023-04-29 10:58:58,693] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 319 +56: [2023-04-29 10:58:58,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt. +56: [2023-04-29 10:58:58,694] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 453 + 7: [2023-04-29 10:58:58,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. +11: [2023-04-29 10:58:58,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt. + 7: [2023-04-29 10:58:58,695] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 56 +11: [2023-04-29 10:58:58,695] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 93 +34: [2023-04-29 10:58:58,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt. +57: [2023-04-29 10:58:58,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt. +45: [2023-04-29 10:58:58,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt. +57: [2023-04-29 10:58:58,695] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 463 +45: [2023-04-29 10:58:58,695] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 367 +34: [2023-04-29 10:58:58,695] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 279 +13: [2023-04-29 10:58:58,696] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 107 + 5: [2023-04-29 10:58:58,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:58,697] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 77 + 5: [2023-04-29 10:58:58,698] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 41 +47: [2023-04-29 10:58:58,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt. +47: [2023-04-29 10:58:58,699] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 381 +42: [2023-04-29 10:58:58,699] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 343 + 6: [2023-04-29 10:58:58,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 6: [2023-04-29 10:58:58,700] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 52 + 7: [2023-04-29 10:58:58,701] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 56 +38: [2023-04-29 10:58:58,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt. +11: [2023-04-29 10:58:58,702] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 93 +38: [2023-04-29 10:58:58,702] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 305 +56: [2023-04-29 10:58:58,702] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 453 +45: [2023-04-29 10:58:58,703] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 367 + 5: [2023-04-29 10:58:58,704] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 41 +57: [2023-04-29 10:58:58,704] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 463 +47: [2023-04-29 10:58:58,705] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 381 +34: [2023-04-29 10:58:58,705] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 279 + 6: [2023-04-29 10:58:58,710] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 52 +38: [2023-04-29 10:58:58,710] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 305 +63: [2023-04-29 10:58:58,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt. +63: [2023-04-29 10:58:58,713] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 509 +63: [2023-04-29 10:58:58,722] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 509 +58: [2023-04-29 10:58:58,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt. +58: [2023-04-29 10:58:58,722] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 471 +63: [2023-04-29 10:58:58,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt. +63: [2023-04-29 10:58:58,726] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 511 +24: [2023-04-29 10:58:58,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +24: [2023-04-29 10:58:58,729] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 196 +58: [2023-04-29 10:58:58,729] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 471 +13: [2023-04-29 10:58:58,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt. +13: [2023-04-29 10:58:58,733] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 109 +23: [2023-04-29 10:58:58,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt. +23: [2023-04-29 10:58:58,734] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 187 +63: [2023-04-29 10:58:58,735] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 511 +24: [2023-04-29 10:58:58,736] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 196 + 7: [2023-04-29 10:58:58,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. + 7: [2023-04-29 10:58:58,736] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 58 + 9: [2023-04-29 10:58:58,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. + 9: [2023-04-29 10:58:58,737] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 76 +20: [2023-04-29 10:58:58,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. +20: [2023-04-29 10:58:58,739] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 160 +16: [2023-04-29 10:58:58,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt. +13: [2023-04-29 10:58:58,740] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 109 +16: [2023-04-29 10:58:58,740] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 131 +23: [2023-04-29 10:58:58,740] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 187 +60: [2023-04-29 10:58:58,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt. +60: [2023-04-29 10:58:58,740] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 487 +56: [2023-04-29 10:58:58,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt. +56: [2023-04-29 10:58:58,741] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 449 + 9: [2023-04-29 10:58:58,743] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 76 + 7: [2023-04-29 10:58:58,744] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 58 +20: [2023-04-29 10:58:58,747] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 160 +16: [2023-04-29 10:58:58,747] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 131 +56: [2023-04-29 10:58:58,748] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 449 +60: [2023-04-29 10:58:58,750] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 487 +59: [2023-04-29 10:58:58,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt. +59: [2023-04-29 10:58:58,754] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 475 +25: [2023-04-29 10:58:58,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt. +25: [2023-04-29 10:58:58,756] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 203 +59: [2023-04-29 10:58:58,761] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 475 + 3: [2023-04-29 10:58:58,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 3: [2023-04-29 10:58:58,764] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 24 +25: [2023-04-29 10:58:58,764] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 203 +17: [2023-04-29 10:58:58,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt. +17: [2023-04-29 10:58:58,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 139 +46: [2023-04-29 10:58:58,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt. +46: [2023-04-29 10:58:58,769] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 371 +37: [2023-04-29 10:58:58,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt. +37: [2023-04-29 10:58:58,769] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 297 + 3: [2023-04-29 10:58:58,770] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 24 +17: [2023-04-29 10:58:58,774] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 139 +46: [2023-04-29 10:58:58,776] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 371 +47: [2023-04-29 10:58:58,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt. +47: [2023-04-29 10:58:58,777] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 379 +37: [2023-04-29 10:58:58,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 297 +47: [2023-04-29 10:58:58,783] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 379 +30: [2023-04-29 10:58:58,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +30: [2023-04-29 10:58:58,787] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 242 +27: [2023-04-29 10:58:58,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt. +22: [2023-04-29 10:58:58,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt. +22: [2023-04-29 10:58:58,790] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 181 +27: [2023-04-29 10:58:58,790] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 221 +30: [2023-04-29 10:58:58,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 242 +52: [2023-04-29 10:58:58,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt. +52: [2023-04-29 10:58:58,796] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 421 + 6: [2023-04-29 10:58:58,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. + 6: [2023-04-29 10:58:58,797] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 50 +22: [2023-04-29 10:58:58,797] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 181 +27: [2023-04-29 10:58:58,798] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 221 +52: [2023-04-29 10:58:58,802] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 421 + 6: [2023-04-29 10:58:58,804] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 50 +29: [2023-04-29 10:58:58,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +29: [2023-04-29 10:58:58,807] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 232 +40: [2023-04-29 10:58:58,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt. +40: [2023-04-29 10:58:58,813] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 325 +14: [2023-04-29 10:58:58,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +48: [2023-04-29 10:58:58,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt. +14: [2023-04-29 10:58:58,814] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 116 +48: [2023-04-29 10:58:58,814] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 385 +29: [2023-04-29 10:58:58,815] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 232 +11: [2023-04-29 10:58:58,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. +11: [2023-04-29 10:58:58,815] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 94 +53: [2023-04-29 10:58:58,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt. +53: [2023-04-29 10:58:58,816] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 427 +59: [2023-04-29 10:58:58,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt. +59: [2023-04-29 10:58:58,817] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 477 +50: [2023-04-29 10:58:58,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt. +50: [2023-04-29 10:58:58,818] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 403 +15: [2023-04-29 10:58:58,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt. +15: [2023-04-29 10:58:58,820] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 121 +40: [2023-04-29 10:58:58,820] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 325 +48: [2023-04-29 10:58:58,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 385 +14: [2023-04-29 10:58:58,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 116 +11: [2023-04-29 10:58:58,822] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 94 +53: [2023-04-29 10:58:58,824] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 427 +59: [2023-04-29 10:58:58,824] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 477 +48: [2023-04-29 10:58:58,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt. +48: [2023-04-29 10:58:58,827] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 387 +15: [2023-04-29 10:58:58,828] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 121 +50: [2023-04-29 10:58:58,829] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 403 +54: [2023-04-29 10:58:58,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt. +54: [2023-04-29 10:58:58,832] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 439 +23: [2023-04-29 10:58:58,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt. +23: [2023-04-29 10:58:58,833] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 185 +29: [2023-04-29 10:58:58,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +29: [2023-04-29 10:58:58,833] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 234 +48: [2023-04-29 10:58:58,834] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 387 +22: [2023-04-29 10:58:58,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt. +22: [2023-04-29 10:58:58,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 183 +22: [2023-04-29 10:58:58,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt. +22: [2023-04-29 10:58:58,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 177 +54: [2023-04-29 10:58:58,840] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 439 +29: [2023-04-29 10:58:58,840] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 234 +23: [2023-04-29 10:58:58,840] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 185 +29: [2023-04-29 10:58:58,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +29: [2023-04-29 10:58:58,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 238 + 2: [2023-04-29 10:58:58,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt. + 2: [2023-04-29 10:58:58,844] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 19 +22: [2023-04-29 10:58:58,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 183 +22: [2023-04-29 10:58:58,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 177 +29: [2023-04-29 10:58:58,847] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 238 + 2: [2023-04-29 10:58:58,850] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 19 +11: [2023-04-29 10:58:58,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. +11: [2023-04-29 10:58:58,852] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 92 +23: [2023-04-29 10:58:58,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. +23: [2023-04-29 10:58:58,852] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 190 +15: [2023-04-29 10:58:58,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt. +15: [2023-04-29 10:58:58,856] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 125 +11: [2023-04-29 10:58:58,859] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 92 +23: [2023-04-29 10:58:58,859] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 190 +15: [2023-04-29 10:58:58,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +15: [2023-04-29 10:58:58,861] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 126 +55: [2023-04-29 10:58:58,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt. +55: [2023-04-29 10:58:58,864] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 445 +15: [2023-04-29 10:58:58,864] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 125 +18: [2023-04-29 10:58:58,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. +18: [2023-04-29 10:58:58,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 146 +15: [2023-04-29 10:58:58,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 126 +16: [2023-04-29 10:58:58,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt. + 1: [2023-04-29 10:58:58,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:58,870] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 135 + 1: [2023-04-29 10:58:58,870] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 10 +16: [2023-04-29 10:58:58,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:58,872] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 130 +55: [2023-04-29 10:58:58,872] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 445 +18: [2023-04-29 10:58:58,874] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 146 + 1: [2023-04-29 10:58:58,876] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 10 + 1: [2023-04-29 10:58:58,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt. +16: [2023-04-29 10:58:58,877] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 135 + 1: [2023-04-29 10:58:58,877] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 9 +16: [2023-04-29 10:58:58,879] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 130 +19: [2023-04-29 10:58:58,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. +19: [2023-04-29 10:58:58,880] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 152 + 1: [2023-04-29 10:58:58,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 9 +24: [2023-04-29 10:58:58,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +24: [2023-04-29 10:58:58,885] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 198 +19: [2023-04-29 10:58:58,887] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 152 +30: [2023-04-29 10:58:58,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt. +30: [2023-04-29 10:58:58,889] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 247 + 3: [2023-04-29 10:58:58,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt. +24: [2023-04-29 10:58:58,891] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 198 + 3: [2023-04-29 10:58:58,892] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 31 +30: [2023-04-29 10:58:58,897] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 247 + 3: [2023-04-29 10:58:58,898] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 31 +56: [2023-04-29 10:58:58,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt. +56: [2023-04-29 10:58:58,901] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 455 +17: [2023-04-29 10:58:58,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt. +17: [2023-04-29 10:58:58,901] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 137 +16: [2023-04-29 10:58:58,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. +16: [2023-04-29 10:58:58,903] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 128 + 3: [2023-04-29 10:58:58,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt. + 3: [2023-04-29 10:58:58,904] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 25 +40: [2023-04-29 10:58:58,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt. +40: [2023-04-29 10:58:58,905] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 321 +28: [2023-04-29 10:58:58,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +28: [2023-04-29 10:58:58,907] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 224 +56: [2023-04-29 10:58:58,909] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 455 +17: [2023-04-29 10:58:58,909] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 137 +16: [2023-04-29 10:58:58,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 128 + 3: [2023-04-29 10:58:58,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 25 + 8: [2023-04-29 10:58:58,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt. +40: [2023-04-29 10:58:58,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 321 + 8: [2023-04-29 10:58:58,912] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 65 +28: [2023-04-29 10:58:58,914] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 224 + 8: [2023-04-29 10:58:58,919] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 65 +10: [2023-04-29 10:58:58,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +10: [2023-04-29 10:58:58,921] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 86 +45: [2023-04-29 10:58:58,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt. +45: [2023-04-29 10:58:58,922] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 365 +54: [2023-04-29 10:58:58,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt. +54: [2023-04-29 10:58:58,924] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 433 +10: [2023-04-29 10:58:58,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 86 +38: [2023-04-29 10:58:58,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt. +47: [2023-04-29 10:58:58,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt. +45: [2023-04-29 10:58:58,929] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 365 +47: [2023-04-29 10:58:58,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 377 +38: [2023-04-29 10:58:58,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 311 +10: [2023-04-29 10:58:58,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt. +10: [2023-04-29 10:58:58,931] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 83 +54: [2023-04-29 10:58:58,931] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 433 +10: [2023-04-29 10:58:58,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt. +10: [2023-04-29 10:58:58,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 81 +25: [2023-04-29 10:58:58,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt. +25: [2023-04-29 10:58:58,934] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 205 +20: [2023-04-29 10:58:58,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +20: [2023-04-29 10:58:58,934] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 162 +38: [2023-04-29 10:58:58,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 311 +47: [2023-04-29 10:58:58,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 377 +10: [2023-04-29 10:58:58,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt. +10: [2023-04-29 10:58:58,936] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 87 +10: [2023-04-29 10:58:58,937] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 83 +37: [2023-04-29 10:58:58,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt. +37: [2023-04-29 10:58:58,938] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 303 +10: [2023-04-29 10:58:58,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 81 +41: [2023-04-29 10:58:58,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt. +41: [2023-04-29 10:58:58,941] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 329 +20: [2023-04-29 10:58:58,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 162 + 7: [2023-04-29 10:58:58,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt. + 7: [2023-04-29 10:58:58,941] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 63 +25: [2023-04-29 10:58:58,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 205 +10: [2023-04-29 10:58:58,942] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 87 +28: [2023-04-29 10:58:58,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +28: [2023-04-29 10:58:58,944] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 226 +37: [2023-04-29 10:58:58,945] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 303 +41: [2023-04-29 10:58:58,948] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 329 + 7: [2023-04-29 10:58:58,948] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 63 +28: [2023-04-29 10:58:58,951] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 226 +21: [2023-04-29 10:58:58,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt. +21: [2023-04-29 10:58:58,956] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 169 + 7: [2023-04-29 10:58:58,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. + 7: [2023-04-29 10:58:58,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 60 +21: [2023-04-29 10:58:58,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 169 +30: [2023-04-29 10:58:58,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt. +30: [2023-04-29 10:58:58,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 243 +18: [2023-04-29 10:58:58,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt. +18: [2023-04-29 10:58:58,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 149 + 7: [2023-04-29 10:58:58,966] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 60 +27: [2023-04-29 10:58:58,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +27: [2023-04-29 10:58:58,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 216 +15: [2023-04-29 10:58:58,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt. +15: [2023-04-29 10:58:58,968] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 127 + 7: [2023-04-29 10:58:58,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. + 7: [2023-04-29 10:58:58,969] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 62 +18: [2023-04-29 10:58:58,971] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 149 +24: [2023-04-29 10:58:58,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt. +24: [2023-04-29 10:58:58,972] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 195 +30: [2023-04-29 10:58:58,972] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 243 +27: [2023-04-29 10:58:58,974] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 216 + 7: [2023-04-29 10:58:58,976] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 62 +15: [2023-04-29 10:58:58,978] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 127 +24: [2023-04-29 10:58:58,980] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 195 +53: [2023-04-29 10:58:58,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt. +53: [2023-04-29 10:58:58,980] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 431 +18: [2023-04-29 10:58:58,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. +18: [2023-04-29 10:58:58,983] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 144 +53: [2023-04-29 10:58:58,986] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 431 + 6: [2023-04-29 10:58:58,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt. + 6: [2023-04-29 10:58:58,987] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 51 + 9: [2023-04-29 10:58:58,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:58,989] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 79 +18: [2023-04-29 10:58:58,991] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 144 + 8: [2023-04-29 10:58:58,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt. + 8: [2023-04-29 10:58:58,992] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 71 + 8: [2023-04-29 10:58:58,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt. + 8: [2023-04-29 10:58:58,994] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 69 + 6: [2023-04-29 10:58:58,994] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 51 + 0: [2023-04-29 10:58:58,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. + 0: [2023-04-29 10:58:58,995] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 4 + 9: [2023-04-29 10:58:58,996] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 79 +14: [2023-04-29 10:58:59,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt. +22: [2023-04-29 10:58:59,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt. +14: [2023-04-29 10:58:59,000] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 117 +22: [2023-04-29 10:58:59,000] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 179 + 8: [2023-04-29 10:58:59,003] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 71 + 8: [2023-04-29 10:58:59,003] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 69 +50: [2023-04-29 10:58:59,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt. +50: [2023-04-29 10:58:59,005] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 407 +44: [2023-04-29 10:58:59,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt. +44: [2023-04-29 10:58:59,005] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 353 + 0: [2023-04-29 10:58:59,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 4 +14: [2023-04-29 10:58:59,007] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 117 +10: [2023-04-29 10:58:59,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt. +10: [2023-04-29 10:58:59,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 85 +22: [2023-04-29 10:58:59,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 179 +29: [2023-04-29 10:58:59,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt. +29: [2023-04-29 10:58:59,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 233 +50: [2023-04-29 10:58:59,012] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 407 +44: [2023-04-29 10:58:59,014] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 353 +10: [2023-04-29 10:58:59,014] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 85 +29: [2023-04-29 10:58:59,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 233 +48: [2023-04-29 10:58:59,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt. +48: [2023-04-29 10:58:59,019] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 389 +13: [2023-04-29 10:58:59,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +13: [2023-04-29 10:58:59,027] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 106 +48: [2023-04-29 10:58:59,028] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 389 +11: [2023-04-29 10:58:59,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +11: [2023-04-29 10:58:59,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 90 +26: [2023-04-29 10:58:59,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt. +13: [2023-04-29 10:58:59,035] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 106 +26: [2023-04-29 10:58:59,035] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 215 +11: [2023-04-29 10:58:59,037] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 90 +36: [2023-04-29 10:58:59,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt. +37: [2023-04-29 10:58:59,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt. +36: [2023-04-29 10:58:59,037] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 293 +37: [2023-04-29 10:58:59,038] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 299 +26: [2023-04-29 10:58:59,042] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 215 +46: [2023-04-29 10:58:59,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt. +46: [2023-04-29 10:58:59,043] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 375 +37: [2023-04-29 10:58:59,044] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 299 +26: [2023-04-29 10:58:59,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt. +26: [2023-04-29 10:58:59,045] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 209 +36: [2023-04-29 10:58:59,047] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 293 +46: [2023-04-29 10:58:59,050] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 375 +15: [2023-04-29 10:58:59,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt. +15: [2023-04-29 10:58:59,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 123 +23: [2023-04-29 10:58:59,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt. +23: [2023-04-29 10:58:59,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 189 +45: [2023-04-29 10:58:59,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt. +45: [2023-04-29 10:58:59,052] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 361 +18: [2023-04-29 10:58:59,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt. +18: [2023-04-29 10:58:59,052] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 147 +26: [2023-04-29 10:58:59,053] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 209 +29: [2023-04-29 10:58:59,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt. +29: [2023-04-29 10:58:59,055] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 239 +20: [2023-04-29 10:58:59,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +20: [2023-04-29 10:58:59,057] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 166 +11: [2023-04-29 10:58:59,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt. +11: [2023-04-29 10:58:59,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 91 +19: [2023-04-29 10:58:59,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt. +19: [2023-04-29 10:58:59,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 153 + 4: [2023-04-29 10:58:59,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. +23: [2023-04-29 10:58:59,059] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 189 + 4: [2023-04-29 10:58:59,059] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 38 +15: [2023-04-29 10:58:59,060] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 123 +18: [2023-04-29 10:58:59,060] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 147 +45: [2023-04-29 10:58:59,061] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 361 +29: [2023-04-29 10:58:59,061] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 239 +12: [2023-04-29 10:58:59,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt. +12: [2023-04-29 10:58:59,063] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 101 +20: [2023-04-29 10:58:59,065] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 166 +19: [2023-04-29 10:58:59,065] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 153 +51: [2023-04-29 10:58:59,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt. +51: [2023-04-29 10:58:59,066] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 411 +11: [2023-04-29 10:58:59,066] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 91 + 4: [2023-04-29 10:58:59,067] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 38 +27: [2023-04-29 10:58:59,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +27: [2023-04-29 10:58:59,068] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 220 + 1: [2023-04-29 10:58:59,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 1: [2023-04-29 10:58:59,069] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 14 +53: [2023-04-29 10:58:59,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt. +53: [2023-04-29 10:58:59,070] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 429 +12: [2023-04-29 10:58:59,070] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 101 +14: [2023-04-29 10:58:59,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt. +14: [2023-04-29 10:58:59,072] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 113 +51: [2023-04-29 10:58:59,073] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 411 + 1: [2023-04-29 10:58:59,076] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 14 +22: [2023-04-29 10:58:59,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +22: [2023-04-29 10:58:59,076] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 180 +27: [2023-04-29 10:58:59,076] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 220 +53: [2023-04-29 10:58:59,077] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 429 +14: [2023-04-29 10:58:59,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. +14: [2023-04-29 10:58:59,078] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 118 +14: [2023-04-29 10:58:59,080] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 113 +12: [2023-04-29 10:58:59,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt. +12: [2023-04-29 10:58:59,081] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 97 +22: [2023-04-29 10:58:59,083] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 180 +14: [2023-04-29 10:58:59,085] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 118 + 0: [2023-04-29 10:58:59,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt. +12: [2023-04-29 10:58:59,089] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 97 +19: [2023-04-29 10:58:59,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt. + 0: [2023-04-29 10:58:59,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 7 +19: [2023-04-29 10:58:59,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 159 +11: [2023-04-29 10:58:59,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt. +11: [2023-04-29 10:58:59,090] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 95 +43: [2023-04-29 10:58:59,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt. +43: [2023-04-29 10:58:59,092] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 351 +55: [2023-04-29 10:58:59,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt. +55: [2023-04-29 10:58:59,095] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 447 + 0: [2023-04-29 10:58:59,096] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 7 +11: [2023-04-29 10:58:59,096] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 95 +43: [2023-04-29 10:58:59,098] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 351 +19: [2023-04-29 10:58:59,099] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 159 +31: [2023-04-29 10:58:59,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt. +31: [2023-04-29 10:58:59,101] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 251 +57: [2023-04-29 10:58:59,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt. +57: [2023-04-29 10:58:59,104] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 461 +55: [2023-04-29 10:58:59,104] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 447 +31: [2023-04-29 10:58:59,108] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 251 +26: [2023-04-29 10:58:59,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +26: [2023-04-29 10:58:59,109] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 210 +57: [2023-04-29 10:58:59,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt. +57: [2023-04-29 10:58:59,112] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 459 +57: [2023-04-29 10:58:59,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 461 +26: [2023-04-29 10:58:59,116] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 210 + 2: [2023-04-29 10:58:59,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt. + 2: [2023-04-29 10:58:59,119] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 21 +57: [2023-04-29 10:58:59,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 459 + 2: [2023-04-29 10:58:59,127] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 21 + 9: [2023-04-29 10:58:59,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:59,130] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 73 +59: [2023-04-29 10:58:59,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt. +59: [2023-04-29 10:58:59,130] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 479 +24: [2023-04-29 10:58:59,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt. +24: [2023-04-29 10:58:59,133] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 199 + 7: [2023-04-29 10:58:59,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt. + 7: [2023-04-29 10:58:59,134] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 57 +24: [2023-04-29 10:58:59,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt. +24: [2023-04-29 10:58:59,136] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 193 +13: [2023-04-29 10:58:59,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:59,137] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 73 +13: [2023-04-29 10:58:59,137] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 105 + 6: [2023-04-29 10:58:59,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt. + 6: [2023-04-29 10:58:59,138] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 49 +59: [2023-04-29 10:58:59,138] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 479 +24: [2023-04-29 10:58:59,139] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 199 + 7: [2023-04-29 10:58:59,141] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 57 +24: [2023-04-29 10:58:59,143] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 193 + 6: [2023-04-29 10:58:59,144] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 49 +13: [2023-04-29 10:58:59,145] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 105 +13: [2023-04-29 10:58:59,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt. +13: [2023-04-29 10:58:59,145] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 111 +49: [2023-04-29 10:58:59,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt. +49: [2023-04-29 10:58:59,146] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 393 +11: [2023-04-29 10:58:59,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt. +11: [2023-04-29 10:58:59,152] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 89 +13: [2023-04-29 10:58:59,152] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 111 +49: [2023-04-29 10:58:59,153] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 393 +18: [2023-04-29 10:58:59,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt. +18: [2023-04-29 10:58:59,154] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 151 +11: [2023-04-29 10:58:59,158] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 89 +40: [2023-04-29 10:58:59,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt. +40: [2023-04-29 10:58:59,161] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 327 +21: [2023-04-29 10:58:59,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +21: [2023-04-29 10:58:59,163] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 174 +18: [2023-04-29 10:58:59,163] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 151 +20: [2023-04-29 10:58:59,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +20: [2023-04-29 10:58:59,164] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 164 +21: [2023-04-29 10:58:59,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt. +21: [2023-04-29 10:58:59,167] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 173 + 9: [2023-04-29 10:58:59,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt. + 9: [2023-04-29 10:58:59,168] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 75 +40: [2023-04-29 10:58:59,169] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 327 +21: [2023-04-29 10:58:59,169] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 174 +20: [2023-04-29 10:58:59,171] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 164 +51: [2023-04-29 10:58:59,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt. +51: [2023-04-29 10:58:59,173] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 413 +21: [2023-04-29 10:58:59,174] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 173 + 9: [2023-04-29 10:58:59,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 75 +27: [2023-04-29 10:58:59,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt. +27: [2023-04-29 10:58:59,179] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 219 +51: [2023-04-29 10:58:59,181] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 413 + 4: [2023-04-29 10:58:59,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt. + 4: [2023-04-29 10:58:59,184] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 37 +27: [2023-04-29 10:58:59,186] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 219 +58: [2023-04-29 10:58:59,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt. +58: [2023-04-29 10:58:59,189] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 467 + 4: [2023-04-29 10:58:59,192] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 37 +28: [2023-04-29 10:58:59,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt. +28: [2023-04-29 10:58:59,192] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 225 +58: [2023-04-29 10:58:59,195] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 467 +28: [2023-04-29 10:58:59,199] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 225 + 6: [2023-04-29 10:58:59,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt. + 6: [2023-04-29 10:58:59,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 55 +28: [2023-04-29 10:58:59,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt. +28: [2023-04-29 10:58:59,201] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 229 +10: [2023-04-29 10:58:59,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. +10: [2023-04-29 10:58:59,203] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 80 +29: [2023-04-29 10:58:59,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt. +29: [2023-04-29 10:58:59,206] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 237 +28: [2023-04-29 10:58:59,207] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 229 + 6: [2023-04-29 10:58:59,209] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 55 +10: [2023-04-29 10:58:59,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 80 + 2: [2023-04-29 10:58:59,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt. + 2: [2023-04-29 10:58:59,214] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 17 +29: [2023-04-29 10:58:59,215] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 237 + 0: [2023-04-29 10:58:59,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt. + 0: [2023-04-29 10:58:59,216] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 1 + 2: [2023-04-29 10:58:59,222] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 17 +17: [2023-04-29 10:58:59,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt. +17: [2023-04-29 10:58:59,223] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 141 + 0: [2023-04-29 10:58:59,224] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 1 +17: [2023-04-29 10:58:59,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 141 +33: [2023-04-29 10:58:59,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt. +33: [2023-04-29 10:58:59,231] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 269 +14: [2023-04-29 10:58:59,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. +14: [2023-04-29 10:58:59,237] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 114 +20: [2023-04-29 10:58:59,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt. +20: [2023-04-29 10:58:59,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 165 +14: [2023-04-29 10:58:59,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +14: [2023-04-29 10:58:59,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 112 +33: [2023-04-29 10:58:59,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 269 +14: [2023-04-29 10:58:59,245] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 114 +20: [2023-04-29 10:58:59,247] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 165 +14: [2023-04-29 10:58:59,248] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 112 +51: [2023-04-29 10:58:59,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt. +51: [2023-04-29 10:58:59,254] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 415 + 0: [2023-04-29 10:58:59,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt. + 0: [2023-04-29 10:58:59,258] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 5 +47: [2023-04-29 10:58:59,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt. +47: [2023-04-29 10:58:59,259] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 383 +12: [2023-04-29 10:58:59,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt. +12: [2023-04-29 10:58:59,260] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 99 +28: [2023-04-29 10:58:59,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt. +28: [2023-04-29 10:58:59,260] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 231 +51: [2023-04-29 10:58:59,261] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 415 +47: [2023-04-29 10:58:59,265] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 383 + 0: [2023-04-29 10:58:59,267] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 5 +27: [2023-04-29 10:58:59,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt. +27: [2023-04-29 10:58:59,267] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 223 +12: [2023-04-29 10:58:59,268] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 99 +28: [2023-04-29 10:58:59,268] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 231 +27: [2023-04-29 10:58:59,274] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 223 +31: [2023-04-29 10:58:59,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt. +31: [2023-04-29 10:58:59,280] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 255 +23: [2023-04-29 10:58:59,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt. +23: [2023-04-29 10:58:59,282] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 191 +31: [2023-04-29 10:58:59,286] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 255 +30: [2023-04-29 10:58:59,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt. +30: [2023-04-29 10:58:59,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 245 +18: [2023-04-29 10:58:59,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt. +18: [2023-04-29 10:58:59,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 145 +18: [2023-04-29 10:58:59,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. +18: [2023-04-29 10:58:59,290] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 150 +23: [2023-04-29 10:58:59,290] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 191 +30: [2023-04-29 10:58:59,294] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 245 + 4: [2023-04-29 10:58:59,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt. + 4: [2023-04-29 10:58:59,295] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 39 +18: [2023-04-29 10:58:59,296] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 145 +18: [2023-04-29 10:58:59,297] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 150 + 7: [2023-04-29 10:58:59,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt. + 7: [2023-04-29 10:58:59,298] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 61 + 4: [2023-04-29 10:58:59,302] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 39 + 7: [2023-04-29 10:58:59,304] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 61 +12: [2023-04-29 10:58:59,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt. +12: [2023-04-29 10:58:59,313] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 103 +58: [2023-04-29 10:58:59,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt. +58: [2023-04-29 10:58:59,315] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 469 +15: [2023-04-29 10:58:59,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. +15: [2023-04-29 10:58:59,317] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 122 +12: [2023-04-29 10:58:59,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 103 +58: [2023-04-29 10:58:59,322] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 469 +20: [2023-04-29 10:58:59,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt. +15: [2023-04-29 10:58:59,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 122 +20: [2023-04-29 10:58:59,324] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 161 +20: [2023-04-29 10:58:59,331] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 161 +43: [2023-04-29 10:58:59,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt. +43: [2023-04-29 10:58:59,341] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 347 +43: [2023-04-29 10:58:59,347] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 347 +21: [2023-04-29 10:58:59,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt. +21: [2023-04-29 10:58:59,348] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 175 +25: [2023-04-29 10:58:59,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt. +25: [2023-04-29 10:58:59,355] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 201 +21: [2023-04-29 10:58:59,355] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 175 +25: [2023-04-29 10:58:59,361] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 201 +37: [2023-04-29 10:58:59,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt. +37: [2023-04-29 10:58:59,368] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 301 + 7: [2023-04-29 10:58:59,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt. + 7: [2023-04-29 10:58:59,369] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 59 +37: [2023-04-29 10:58:59,374] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 301 + 7: [2023-04-29 10:58:59,377] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 59 +26: [2023-04-29 10:58:59,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt. +26: [2023-04-29 10:58:59,379] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 211 +28: [2023-04-29 10:58:59,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt. +28: [2023-04-29 10:58:59,382] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 227 +26: [2023-04-29 10:58:59,387] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 211 +28: [2023-04-29 10:58:59,389] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 227 +19: [2023-04-29 10:58:59,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt. +19: [2023-04-29 10:58:59,393] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 155 +19: [2023-04-29 10:58:59,400] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 155 +26: [2023-04-29 10:58:59,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt. +26: [2023-04-29 10:58:59,401] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 213 + 6: [2023-04-29 10:58:59,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt. + 6: [2023-04-29 10:58:59,402] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 53 +26: [2023-04-29 10:58:59,409] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 213 + 6: [2023-04-29 10:58:59,411] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 53 +14: [2023-04-29 10:58:59,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt. +14: [2023-04-29 10:58:59,428] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 115 +14: [2023-04-29 10:58:59,436] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 115 + 4: [2023-04-29 10:58:59,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt. + 4: [2023-04-29 10:58:59,441] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 35 + 4: [2023-04-29 10:58:59,448] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 35 +16: [2023-04-29 10:58:59,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt. +16: [2023-04-29 10:58:59,455] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 133 + 5: [2023-04-29 10:58:59,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt. + 5: [2023-04-29 10:58:59,459] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 43 + 1: [2023-04-29 10:58:59,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt. + 1: [2023-04-29 10:58:59,462] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 11 +16: [2023-04-29 10:58:59,463] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 133 + 5: [2023-04-29 10:58:59,466] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 43 + 1: [2023-04-29 10:58:59,469] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 11 +14: [2023-04-29 10:58:59,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt. +14: [2023-04-29 10:58:59,478] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 119 +14: [2023-04-29 10:58:59,485] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 119 + 4: [2023-04-29 10:58:59,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt. + 4: [2023-04-29 10:58:59,492] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 33 + 4: [2023-04-29 10:58:59,498] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 33 +16: [2023-04-29 10:58:59,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt. +16: [2023-04-29 10:58:59,500] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 129 +30: [2023-04-29 10:58:59,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt. +30: [2023-04-29 10:58:59,505] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 241 +16: [2023-04-29 10:58:59,508] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 129 +30: [2023-04-29 10:58:59,512] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 241 + 2: [2023-04-29 10:58:59,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt. + 2: [2023-04-29 10:58:59,525] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 23 +21: [2023-04-29 10:58:59,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt. +21: [2023-04-29 10:58:59,528] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 171 +20: [2023-04-29 10:58:59,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt. +20: [2023-04-29 10:58:59,530] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 163 + 2: [2023-04-29 10:58:59,534] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 23 +21: [2023-04-29 10:58:59,534] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 171 +20: [2023-04-29 10:58:59,537] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 163 +20: [2023-04-29 10:58:59,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt. +20: [2023-04-29 10:58:59,611] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 167 +20: [2023-04-29 10:58:59,618] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 167 +29: [2023-04-29 10:58:59,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt. +29: [2023-04-29 10:58:59,632] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 235 + 0: [2023-04-29 10:58:59,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt. + 0: [2023-04-29 10:58:59,637] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 3 +29: [2023-04-29 10:58:59,641] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 235 + 0: [2023-04-29 10:58:59,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 3 + 0: successfully loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b44b at iteration 0 +63: time (ms) | load-checkpoint: 18107.31 + 0: estimated model parameters: 8.905678848 + 0: estimated model parameters without embeddings: 8.458985472 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-04-29 10:59:01 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 51200 + 0: test: 51200 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.027666 seconds + 0: number of documents: 835726 + 0: > dataset split: + 0: train: + 0: document indices in [0, 835726) total of 835726 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.002 seconds + 0: total number of samples: 195101 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.000804 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.010 seconds + 0: total number of samples: 84978 + 0: total number of epochs: 1 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-04-29 10:59:08 + 0: done with setup ... + 0: training ... +63: time (ms) | model-and-optimizer-setup: 38412.79 | train/valid/test-data-iterators-setup: 4003.16 + 0: [after training is done] datetime: 2023-04-29 10:59:08 +63: ----------------------------------------------------------------------------------------------------------------- +63: validation loss at the end of training for val data | lm loss value: 2.351177E+00 | lm loss PPL: 1.049792E+01 | +63: ----------------------------------------------------------------------------------------------------------------- +END 3430925: Sat 29 Apr 2023 11:00:38 AM EEST